<?xml version="1.0" encoding="UTF-8"?>
<?xml-stylesheet type="text/xsl" media="screen" href="/~d/styles/atom10full.xsl"?><?xml-stylesheet type="text/css" media="screen" href="http://feeds.feedburner.com/~d/styles/itemcontent.css"?><feed xmlns="http://www.w3.org/2005/Atom" xmlns:openSearch="http://a9.com/-/spec/opensearch/1.1/" xmlns:georss="http://www.georss.org/georss" xmlns:gd="http://schemas.google.com/g/2005" xmlns:thr="http://purl.org/syndication/thread/1.0" xmlns:feedburner="http://rssnamespace.org/feedburner/ext/1.0" gd:etag="W/&quot;CUUMR3c-cSp7ImA9WhRUFUk.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050</id><updated>2012-01-25T18:01:26.959-08:00</updated><category term="Moses" /><category term="GALA" /><category term="Italy" /><category term="China" /><category term="statistical  MT" /><category term="global business" /><category term="collaboration" /><category term="localization" /><category term="Asia" /><category term="BLEU" /><category term="inspiration" /><category term="transcreation" /><category term="globalization" /><category term="censorship" /><category term="Google" /><category term="Information poverty" /><category term="Controlled Language" /><category term="information quality" /><category term="Internet trends" /><category term="translation technology" /><category term="MT" /><category term="innovation" /><category term="industry associations" /><category term="customer loyalty" /><category term="customer support" /><category term="standards" /><category term="AMTA" /><category term="customer care" /><category term="crowdsourcing" /><category term="Post-editing" /><category term="translation quality" /><category term="India" /><category term="SMT" /><category term="e-commerce opportunity" /><category term="conferences" /><category term="humor" /><title>eMpTy Pages</title><subtitle type="html">Comments about translation technology, localization and collaboration</subtitle><link rel="http://schemas.google.com/g/2005#feed" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/posts/default" /><link rel="alternate" type="text/html" href="http://kv-emptypages.blogspot.com/" /><link rel="next" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default?start-index=10&amp;max-results=9&amp;redirect=false&amp;v=2" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><generator version="7.00" uri="http://www.blogger.com">Blogger</generator><openSearch:totalResults>68</openSearch:totalResults><openSearch:startIndex>1</openSearch:startIndex><openSearch:itemsPerPage>9</openSearch:itemsPerPage><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="self" type="application/atom+xml" href="http://feeds.feedburner.com/EmptyPages" /><feedburner:info uri="emptypages" /><atom10:link xmlns:atom10="http://www.w3.org/2005/Atom" rel="hub" href="http://pubsubhubbub.appspot.com/" /><feedburner:emailServiceId>EmptyPages</feedburner:emailServiceId><feedburner:feedburnerHostname>http://feedburner.google.com</feedburner:feedburnerHostname><entry gd:etag="W/&quot;CUUDQXg-fSp7ImA9WhRUFU4.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-1117184695993454900</id><published>2012-01-25T15:01:00.000-08:00</published><updated>2012-01-25T15:14:30.655-08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-25T15:14:30.655-08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="translation quality" /><category scheme="http://www.blogger.com/atom/ns#" term="BLEU" /><category scheme="http://www.blogger.com/atom/ns#" term="SMT" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><title>A Short Guide to Measuring and Comparing Machine Translation Engines</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;img align="left" src="http://www.asiaonline.net/images/Quality.png" style="margin-top: 0px; padding-top: 0px;" /&gt;
                                        &lt;i&gt;This is an article from the Asia Online &lt;a href="http://www.asiaonline.net/newsletters/201111.htm"&gt;November 2011 Newsletter&lt;/a&gt; that provides useful advice for meaningful comparisons of&amp;nbsp; MT engines and is authored by Dion Wiggins, CEO of Asia Online. So the next time somebody promises you a BLEU of 60, be skeptical, and make sure you get the proper context and assurances that it was properly done.&lt;b&gt;&lt;br /&gt;&lt;/b&gt;&lt;/i&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;&lt;b&gt;“What is your &lt;a href="http://kv-emptypages.blogspot.com/2010/03/need-for-automated-quality-measurement.html"&gt;BLEU&lt;/a&gt; score?”&lt;/b&gt;&lt;/i&gt; This is the single most &lt;b&gt;&lt;i&gt;&lt;u&gt;irrelevant
                                            question&lt;/u&gt;&lt;/i&gt;&lt;/b&gt; relating to translation quality, yet one of the most frequently
                                        asked. BLEU scores and other translation quality metrics greatly depend on many
                                        factors that must be understood in order for a score to be meaningful. A BLEU score
                                        of 20 in some cases can be better than a BLEU score of 50 or vice versa. Without
                                        understanding how a test set was measured and other details such as language pair
                                        and domain complexity, a BLEU score without context is not much more than a meaningless number. &lt;i&gt;(For a primer on BLEU &lt;a href="http://kv-emptypages.blogspot.com/2010/03/need-for-automated-quality-measurement.html"&gt;look here&lt;/a&gt;.)&lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
                                        &lt;/span&gt;&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
BLEU scores and other translation quality metrics will vary based upon:&lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-left: -15px;"&gt;
&lt;li&gt;&lt;b&gt;The test set being measured:&lt;/b&gt;
 Different test sets will give very different
                                                scores. A test set that 
is out of domain will usually score lower than a test set
                                                that is in the domain of
 the translation engine being tested. The quality of the
                                                segments in the test set should be gold 
standard (i.e. validated as correct by humans). Lower quality test set data will give a less meaningful
                                                score.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;How many human reference translations were used:&lt;/b&gt;
 If there is more than one
                                                human reference 
translation, the resulting BLEU score will be higher as there are
                                                more opportunities for 
the machine translation to match part of the reference.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;The complexity of the language pair:&lt;/b&gt;
 Spanish is a simpler language in terms
                                                of grammar and structure
 than Finnish or Chinese relative to English. Typically if the source or target
                                                language is relatively more complex,&amp;nbsp; the BLEU score will be lower. &lt;/li&gt;
&lt;li&gt;&lt;b&gt;The complexity of the domain:&lt;/b&gt;
 A patent has far more complex text and structure
                                                than a children’s story 
book. Very different metric scores will be calculated based
                                                on the complexity of the
 domain. It is not practical to compare two different test
                                                sets and conclude that 
one translation engine is better than the other.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;The capitalization of the segments being measured:&lt;/b&gt;
 When comparing metrics,
                                                the most common form of 
measurement is Case Insensitive. However when publishing,
                                                Case Sensitive is also 
important and may also be measured.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;The measurement software:&lt;/b&gt;
 There are many measurement tools for translation
                                                quality. Each may vary 
slightly with respect to how a score is calculated, or the
                                                settings for the measure
 tools may not be set the same. The same measurement software
                                                should be used for all 
measurements. Asia Online provides&lt;a href="http://www.languagestudio.com/ToolsAndDownloads.aspx"&gt; Language Studio™                                                Pro free&lt;/a&gt; of charge and this software 
measures the scores, for a given test set, for a variety of quality metrics.&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
It is clear from the above list of variables that a BLEU score number by itself
                                            has no real meaning.
                                        &lt;/div&gt;
&lt;div style="color: #9f1111; font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: 14px; font-weight: bold; padding-right: 3px; padding-top: 10px;"&gt;
How BLEU scores and other translation metrics are measured&lt;/div&gt;
&lt;div style="text-align: center;"&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
                                        &lt;/span&gt;&lt;img src="http://www.asiaonline.net/images/Newsletter/HowTestSetsAreMeasured510.png" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;" /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
With BLEU scores, a higher 
score indicates higher quality. A BLEU score is not a
                                            linear metric. A 2 BLEU 
point increase from 20 to 22 will be considerably more noticeable
                                            than the same increase from 
50 to 52. F-Measure and METEOR also work in this manner
                                            where a higher score is also
 better. For Translation Error Rate (TER), a lower score
                                            is a better score. Language 
Studio™ Pro supports all of these metrics and
                                            can be &lt;a href="http://www.languagestudio.com/ToolsAndDownloads.aspx"&gt;downloaded for free&lt;/a&gt;.
                                        &lt;/div&gt;
&lt;div style="color: #9f1111; font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: 14px; font-weight: bold; padding-top: 10px;"&gt;
Basic Test Set Criteria Checklist&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-top: 0px; padding-top: 0px; text-align: justify;"&gt;
The criteria specified by this checklist are absolute. Not complying with any of
                                            the checklist items will result in a score that is unreliable and less meaningful.&lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-left: -15px;"&gt;
&lt;li&gt;&lt;b&gt;Test Set Data should be very high quality:&lt;/b&gt; If the test set data are of low
                                                quality, then the measurement delivered will not be reliable.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Test set should be in domain: &lt;/b&gt;The test set should represent the type of information
                                                that you are going to translate. The domain, writing style and vocabulary should
                                                be representative of what you intend to translate. Testing on out-of-domain text
                                                will not result in a useful metric.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Test Set Data &lt;u&gt;must not&lt;/u&gt; be included in the training Data:&lt;/b&gt;
 If you are
                                                creating an SMT engine, 
then you must make sure that the data you are testing with
                                                or very similar data are
 not in the data that the engine was trained with. If the
                                                test data are in the 
training data the scores will be artificially high and will
                                                not represent the level of quality that will be output when other "blind" data are
                                                translated.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Test Set Data should be data that can be translated: &lt;/b&gt;Test
 set segments should
                                                have a minimal amount of
 dates, times, numbers and names. While a valid part a segment,
                                                they are not parts of 
the segment that are translated; they are usually transformed
                                                or mapped. The focus for a
 test set should be on words that are to be translated.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Test Set Data should have segments that are at between 8 and 15 words in length:&lt;/b&gt;
                                                Short segments will 
artificially raise the quality scores as most metrics do not
                                                take into account 
segment length. Short segments are more likely to get a perfect
                                                match of the entire 
phrase, which is not a translation and is more like 100% match
                                                with a translation 
memory. The longer the segment, the more opportunity there is
                                                for variations on what 
is being translated. This will result in artificially lower
                                                scores, even if the 
translation is good. A small number of segments shorter than
                                                8 words or longer than 
15 words are acceptable, but these should be limited.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Test set should be at least 1,000 segments: &lt;/b&gt;While
 it is possible to get a
                                                metric from shorter test
 sets, a reasonable statistic representation of the metric
                                                can only be created when
 there are sufficient segments to build statistics from.
                                                When there are only a 
low number of segments, small anomalies in one or two segments
                                                can raise or reduce the 
test set score artificially.Be skeptical of scores from test sets that only contain a few hundred sentences.&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="color: #9f1111; font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: 14px; font-weight: bold; padding-top: 10px;"&gt;
Comparing Translation Engines - Initial Assessment Checklist&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-top: 0px; padding-top: 0px; text-align: justify;"&gt;
Language Studio™ can be used for calculating BLEU, TER, F-Measure and METEOR
                                            scores.
                                        &lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-left: -15px;"&gt;
&lt;li&gt;&lt;b&gt;All conditions of the Basic Test Set Criteria must be met: &lt;/b&gt;If
 any condition
                                                is not met, then the 
results of the test could be flawed and not meaningful or reliable.&lt;/li&gt;
&lt;b&gt;Test set must be consistent:&lt;/b&gt;
 The exact same test set must be used for comparison
                                            across all translation 
engines. Do not use different test sets for different engines.
&lt;li&gt;&lt;b&gt;Test sets should be “blind”:&lt;/b&gt;
 If the MT engine has seen the test set before
                                                or included the test set
 data in the training data, then the quality of the output
                                                will be artificially 
high and not represent the true quality of the system.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Tests must be carried out transparently: &lt;/b&gt;Where
 possible, submit the data
                                                yourself to the MT 
engine and get it back immediately. Do not rely on a third party
                                                to submit the data. If 
there are no tools or APIs for test set submission, the test
                                                set should be returned 
within 10 minutes of being submitted to the vendor via email.
                                                This removes any 
possibility of the MT vendor tampering with the output or fine
                                                tuning the engine based 
on the output.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Word Segmentation and Tokenization must be consistent: &lt;/b&gt;If
 Word Segmentation
                                                is required (i.e. for 
languages such as Chinese, Japanese and Thai) then the same
                                                word segmentation tool 
should be used on the reference translations and all the
                                                machine translation 
outputs. The same tokenization should also be used. &lt;a href="http://www.languagestudio.com/ToolsAndDownloads.aspx"&gt;Language                                                Studio™ Pro&lt;/a&gt; provides a 
simple means to ensure all tokenization is consistent
                                                with its embedded 
tokenization technology.&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="color: #9f1111; font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: 14px; font-weight: bold; padding-top: 10px;"&gt;
&lt;span style="font-size: small;"&gt;Ability to Improve is More Important than Initial Translation Engine Quality&lt;/span&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-top: 0px; padding-top: 0px; text-align: justify;"&gt;
The initial scores of a machine translation engine, while indicative of initial quality,
                                            should be viewed as a starting point for rapid improvement which is measured by
                                            the test set and BLEU scores. Depending on the volume and quality of data provided
                                            to the SMT vendor for training, the quality may be lower or higher. Most often, &lt;b&gt;more important
                                                than the initial quality is how quickly the translation engine quality improves&lt;/b&gt;.&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-top: 0px; padding-top: 0px; text-align: justify;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
Frequently a new translation engine will have gaps in vocabulary and grammatical
                                            coverage. &lt;b&gt;Other machine 
translation vendors’ engines do not improve at all or merely
                                                improve very little 
unless huge volumes of data are added to the initial training
                                                data.&lt;/b&gt; Most vendors 
recommend retraining once you have gathered a volume
                                            of additional data that is 
at least 20% of the size of the initial training data that the
                                            engine was trained on. Even 
when this volume of data is added, only a small improvement
                                            is achieved. As a result, 
very few translation engines evolve in quality much further
                                            than their initial quality.
                                        &lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
                                        &lt;/span&gt;&lt;img align="right" src="http://www.asiaonline.net/images/4stepcycle.png" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;" /&gt;
                                        &lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
In stark contrast, Language 
Studio™ translation engines are created with millions
                                            of sentences of data that 
Asia Online has prepared in addition to the data that
                                            the customer provides. The 
translation engines improve rapidly with a very small
                                            amount of feedback. It is 
not uncommon to get a 1-2 BLEU score improvement with
                                            as little as a few thousand 
post-edited sentences. Language Studio has a unique
                                            4 step approach that 
leverages the benefits of Clean Data SMT and manufactures additional
                                            learning data by directly 
analyzing the edits made to the machine translated output.
                                        &lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
Consequently, only a small 
amount of post-edited feedback can improve Language Studio™
                                            translation engine quality 
quite considerably, and it can do so at speeds much faster
                                            and with far less effort 
than with other machine translation vendors. &lt;span style="color: red;"&gt;
                                                &lt;i&gt;Asia Online provides 
complimentary Incremental Improvement Trainings to encourage
                                                    rapid translation 
engine quality improvement with every full customization and also
                                                    offers additional 
complimentary Incremental Improvement Trainings when word packages
                                                    are purchased, 
greatly reducing Total Cost of Ownership (TCO).&amp;nbsp;&lt;/i&gt;&lt;/span&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
&lt;span style="color: red;"&gt;&lt;i&gt;&amp;nbsp;&lt;/i&gt;&lt;/span&gt;
                                        &lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
&lt;b&gt;An investment in quality at 
the development stages of a translation engine impacts
                                            and reduces the cost of post
 editing directly, while increasing post editing productivity.&lt;/b&gt;
                                            While the development of some rules, 
normalization, glossary and non-translatable term work will assist
                                            in the rate of improvement,
 the fastest and most efficient way to improve Language
                                            Studio™ engines is to post 
edit the translations and feed them back into Language
                                            Studio™ for processing. The 
edits will be analyzed and new training data will
                                            be generated, directly 
addressing the primary cause of most errors. In other words,
                                            just post editing as part of
 a normal project will result in an immediate improvement.
                                            Little or no other extra 
effort is needed. By leveraging the standard post editing
                                            process, the effort and cost
 of improvement as well as the volume of data required
                                            in order to improve is 
greatly reduced.&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
Depending on the initial training data provided by the client, a small number of
                                            Incremental Improvement Trainings are usually sufficient for most Language Studio™
                                            translation engines to improve to a quality level approaching near-human quality.&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
Other machine translation 
vendors are now also claiming to build systems based on
                                            Clean Data SMT. Closer 
investigation reveals that their definition of “cleaning”
                                            is not the same as Asia 
Online. Removing formatting tags is not cleaning data.
                                            Language Studio™ analyzes 
translation memories and other training data and
                                            ensures that only the 
highest quality in domain data from trusted sources is included
                                            in the creation of your 
custom engine. The result is that improvements are rapid.
                                            Even with just a few 
thousand segments edited, the improvements are notable. When
                                            combined with Language 
Studio™ hybrid rules and an SMT approach to machine
                                            translation the quality of 
the translation output can increase by as much as 10,
                                            20 or even 30 BLEU points 
between versions.
                                        &lt;/div&gt;
&lt;div style="color: #9f1111; font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: 14px; font-weight: bold; padding-top: 10px;"&gt;
Comparing Translation Engines – Translation Quality Improvement Assessment&lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-left: -15px;"&gt;
&lt;li&gt;&lt;b&gt;Comparing Versions:&lt;/b&gt;
 When comparing improvements between versions of a translation
                                                engine from a single 
vendor, it is possible to work with just one test set, but
                                                the vendor must ensure 
that the test set remains “blind” and that the scores are
                                                not biased towards the 
test set. Only then can a meaningful representation of quality
                                                improvement be achieved.&lt;/li&gt;
&lt;li&gt;&lt;b&gt;Comparing Machine Translation Vendors:&lt;/b&gt;
 When comparing translation engine
                                                output from different 
vendors, a second “blind” test set is often needed to measure
                                                improvement. While you 
can use the first test set, it is often difficult to ensure
                                                that the vendor did not 
adapt its system to better suit and be biased towards the
                                                test set and in doing so
 delivering an artificially high score. It is also possible
                                                for the test 
set data to be added to engines training data which will
                                                also bias the score.&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
As a general rule, if you 
cannot be 100% certain that the vendor has not included
                                            the first test set data or 
adapted the engine to suit the test set, then a second
                                            “blind” test set is 
required. When a second test set is used, a measurement should
                                            be taken from the original 
translation engine and compared to the improved translation
                                            engine to give a meaningful 
result that can be trusted and relied upon.
                                        &lt;/div&gt;
&lt;div style="color: #9f1111; font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: 14px; font-weight: bold; padding-top: 10px;"&gt;
Bringing It All Together
                                        &lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-top: 0px; padding-top: 0px; text-align: justify;"&gt;
The table below shows a real
 world example of a version 1 translation engine from
                                            Asia Online and an improved 
version after feedback. Additional rules were added
                                            to the translation to meet 
specific client requirements, which resulted in
                                            considerable improvement in 
translation quality. This is part of Asia Online’s standard
                                            customization process. 
Language Studio™ puts a very high level of control
                                            in the customer’s hands 
where rules, runtime glossaries, non-translatable terms
                                            and other customization 
features &lt;b&gt;ensure the quality of the output is as close to
                                            human quality and requires 
the least amount of editing possible.&amp;nbsp;&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; margin-top: 0px; padding-top: 0px; text-align: justify;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
                                        &lt;/span&gt;&lt;br /&gt;
&lt;table border="0" cellpadding="0" cellspacing="0" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
                                            &lt;tbody&gt;
&lt;tr&gt;
                                                &lt;td rowspan="2" style="color: #9f1111; font-size: 18px; font-weight: bold; padding-right: 3px; text-align: left;" valign="bottom"&gt;BLEU Score&lt;br /&gt;
Comparisons&lt;br /&gt;
&lt;div style="color: #9f1111; font-size: 14px; font-weight: bold; padding-right: 3px; padding-top: 10px;"&gt;
Case Sensitive&lt;/div&gt;
&lt;/td&gt;
                                                &lt;td colspan="3" nowrap="nowrap" style="background: #92D050; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;" valign="bottom"&gt;Asia Online
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;" valign="bottom"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;" valign="bottom"&gt;&lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;" valign="bottom"&gt;&lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td nowrap="nowrap" style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center; width: 50px;" valign="bottom"&gt;V1&lt;br /&gt;
SMT
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center; width: 50px;" valign="bottom"&gt;V2&lt;br /&gt;
SMT
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center; width: 50px;" valign="bottom"&gt;V2&lt;br /&gt;
SMT +
                                                    &lt;br /&gt;
Rules
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #E5B8B7; border-right: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center; width: 50px;" valign="bottom"&gt;Google
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #CCC0D9; border-right: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center; width: 50px;" valign="bottom"&gt;Bing
                                                &lt;/td&gt;
                                                &lt;td nowrap="nowrap" style="background: #B6DDE8; border-right: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center; width: 50px;" valign="bottom"&gt;Systran
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td&gt;Reference 1
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;36.05
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;45.96
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;56.59
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;30.58
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;29.64
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;21.01
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td&gt;Reference 2
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;35.80
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;39.31
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;48.85
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;32.05
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;29.94
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;22.56
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td&gt;Reference 3
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;38.65
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;52.31
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;65.03
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;35.51
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;33.17
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;24.68
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td nowrap="nowrap" style="font-weight: bold; padding-right: 3px;"&gt;Combined References
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-bottom: 1px solid black; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;50.45
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;66.52
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;80.48
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;44.58
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;41.65
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;30.26
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td nowrap="nowrap" style="color: #9f1111; font-size: 14px; font-weight: bold; padding-right: 3px; padding-top: 6px;"&gt;Case Insensitive
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC;"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C;"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050;"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7;"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9;"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8;"&gt;&amp;nbsp;
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td&gt;Reference 1
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;41.30
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;52.65
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;59.25
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;32.18
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;31.49
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;22.49
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td&gt;Reference 2
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;41.01
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;45.32
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;51.24
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;33.67
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;31.64
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;23.88
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td&gt;Reference 3
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;43.99
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;58.97
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;67.49
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;37.15
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;35.01
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-right: 1px solid black; border-top: 1px solid black; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;25.92
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;tr&gt;
                                                &lt;td style="font-weight: bold;"&gt;Combined References
                                                &lt;/td&gt;
                                                &lt;td style="background: #D6E3BC; border-bottom: 1px solid black; border-left: 1px solid black; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;56.83
                                                &lt;/td&gt;
                                                &lt;td style="background: #B8E08C; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;74.35
                                                &lt;/td&gt;
                                                &lt;td style="background: #92D050; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;82.89
                                                &lt;/td&gt;
                                                &lt;td style="background: #E5B8B7; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;46.26
                                                &lt;/td&gt;
                                                &lt;td style="background: #CCC0D9; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;43.68
                                                &lt;/td&gt;
                                                &lt;td style="background: #B6DDE8; border-bottom: 1px black solid; border-right: 1px solid black; border-top: 1px solid black; font-weight: bold; padding-bottom: 3px; padding-left: 3px; padding-right: 3px; text-align: center;"&gt;31.68
                                                &lt;/td&gt;
                                            &lt;/tr&gt;
&lt;/tbody&gt;&lt;/table&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; font-size: smaller; font-style: italic; font-weight: bold; text-align: right;"&gt;
*Language Pair: English into French. &amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;Domain: Information
                                            Technology.&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
It can be seen clearly from 
the scores above that when all three human reference
                                            translations are combined 
the BLEU score is significantly higher and that the BLEU
                                            scores vary considerably 
between each of the human reference translations. The impact
                                            of the improvement and the 
application of client specific rules can also be seen,
                                            raising the case sensitive 
BLEU score from 50.45 to 80.48 (an increase of 30.03
                                            in just one improvement 
iteration). One interesting side effect of having multiple
                                            human references is that it 
is often possible to judge the quality of the human
                                            reference also. In the 
example above, the machine translation output is much closer
                                            to human reference 3, 
indicating a higher quality reference. The client later confirmed
                                            that the editor who prepared
 the reference was a senior editor and more skilled
                                            than the other 2 editors who
 prepared human reference 1 and 2.&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
                                        &lt;/span&gt;&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: justify;"&gt;
A BLEU score, as with other 
translation metrics, is just a meaningless number unless
                                            it is established in a 
controlled environment. Asking “What is your BLEU score?”
                                            could result in any one of 
the above scores being given. When controls are applied,
                                            translation metrics can be 
used both to measure improvements in a translation engine
                                            and compare translation 
engines from different vendors. However, while automated
                                            metrics are useful, the 
ultimate measurement is still a human assessment. Language Studio™
                                            Pro also provides tools to 
assist in delivering balanced, repeatable and meaningful metrics
                                            for human quality 
assessment.
                                        &lt;/div&gt;
&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-1117184695993454900?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/vkDl7s4zTRDEaZ0h8OeO0O765as/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/vkDl7s4zTRDEaZ0h8OeO0O765as/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/vkDl7s4zTRDEaZ0h8OeO0O765as/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/vkDl7s4zTRDEaZ0h8OeO0O765as/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=5I3QnbOB8KI:FHtMwNql2XU:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=5I3QnbOB8KI:FHtMwNql2XU:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=5I3QnbOB8KI:FHtMwNql2XU:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=5I3QnbOB8KI:FHtMwNql2XU:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/5I3QnbOB8KI" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/1117184695993454900/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2012/01/short-guide-to-measuring-and-comparing.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/1117184695993454900?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/1117184695993454900?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/5I3QnbOB8KI/short-guide-to-measuring-and-comparing.html" title="A Short Guide to Measuring and Comparing Machine Translation Engines" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><thr:total>0</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2012/01/short-guide-to-measuring-and-comparing.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CUUMR3c8fSp7ImA9WhRUFUk.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-1503896305335051575</id><published>2011-12-29T16:22:00.001-08:00</published><updated>2012-01-25T18:01:26.975-08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-25T18:01:26.975-08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="Post-editing" /><category scheme="http://www.blogger.com/atom/ns#" term="SMT" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><title>Review: Most Popular Blog Posts from 2011</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;blockquote class="tr_bq"&gt;
&lt;h5 style="font-weight: normal;"&gt;





&lt;span style="font-size: small;"&gt;&lt;b style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;i&gt;&lt;span class="ldquo"&gt;“&lt;/span&gt;Blogs 
are about sharing with authenticity. A good blog can help you really 
connect deeply with your audience in a meaningful way because the 
content is not only relevant but insightful and personal. &lt;/i&gt;&lt;i&gt; I think most enterprises miss that point. When you do it right, your 
customers will walk away not only having learned something new but will 
also feel much more connected to your brand&lt;/i&gt;&lt;/b&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;.&lt;/span&gt;&lt;b style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;i&gt;&lt;span class="rdquo"&gt;”&lt;/span&gt;&lt;/i&gt;&lt;/b&gt;&lt;/span&gt;&lt;b style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;i&gt;&lt;span style="font-size: small;"&gt;&amp;nbsp;&amp;nbsp;&lt;/span&gt;&amp;nbsp;&amp;nbsp; &lt;/i&gt;David Armano&lt;/b&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt; EVP, Global Innovation &amp;amp; Integration at &lt;/span&gt;&lt;a href="http://www.edelmandigital.com/" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;Edelman Digital&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt; &lt;/span&gt;&lt;/span&gt;&lt;/h5&gt;
&lt;/blockquote&gt;
&lt;div class="colored-panel"&gt;
&lt;blockquote&gt;
&lt;div style="text-align: left;"&gt;
&lt;i&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;b&gt;Don’t say anything online that you wouldn’t want plastered on a billboard with your face on it&lt;/b&gt;. &lt;/span&gt;-- &lt;/i&gt;&lt;i style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;b&gt;Erin Bury&lt;/b&gt;&lt;/i&gt;&lt;/div&gt;
&lt;/blockquote&gt;
&lt;br /&gt;
&amp;nbsp;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;One of the things that I enjoy about blogging is the feedback that one gets, and the continuing and evolving&amp;nbsp; discussion that sometimes comes forth from these posts. I find it helps to clarify my thinking on what really matters, and the critical feedback one gets, on assumptions that may previously go unquestioned is very useful in just evolving my own thinking on these issues. The feedback and the rankings helps me, and others too, I think, to understand what &lt;a href="http://www.thefreedictionary.com/strike+a+chord"&gt;strikes a chord&lt;/a&gt; in the reader community, and can also sometimes help to guide further evolutionary thinking on the subjects at hand. This is is a ranking of the most popular (Unique Visitors and Page Views) posts of the year based on the data provided by Google Analytics.&lt;/span&gt;&lt;/div&gt;
&lt;ol&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/06/analysis-of-shutdown-announcements-of.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;Analysis of the Shutdown Announcements of the Google Translate API&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt; and the &lt;/span&gt;&lt;a href="http://kv-emptypages.blogspot.com/2011/07/google-translate-api-furor-analysis-of.html" style="font-weight: normal;"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;subsequent posts&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; on what this may mean for the translation industry were by far the most popular posts of the year. The original post authored by Dion Wiggins was also referenced by the &lt;/span&gt;&lt;a href="http://www.theatlantic.com/technology/archive/2011/06/an-economic-burden-google-can-no-longer-bear/240283/" style="font-weight: normal;"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;Atlantic&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; and&amp;nbsp; other mainstream media and still continues to be an influential view on the announcement today, probably much more so than any other publicly offered opinion in the professional translation industry.&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/09/continuing-saga-evolution-of-machine.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;The Continuing Saga &amp;amp; Evolution of Machine Translation&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; &lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;was coverage of the IMTT 7th Conference in Cordoba triggered active debates and discussions MT, automation and translator compensation in several forums and clearly struck a chord for many.&lt;/span&gt;&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/03/future-of-translation-memory-tm.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;The Future of Translation Memory (TM)&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; is a posting that continues to receive high new visit rates long after it was originally published.&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/10/building-momentum-for-post-edited.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;The Building Momentum for Post-Edited Machine Translation (PEMT)&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; a number of case studies on the increasing use of post-edited MT to meet business timeliness and production cost requirements. &lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/01/end-of-road-for-more-data-better.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;Has Google Translate Reached the Limits of its Ongoing Improvement?&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; More evidence that more data Is not always better especially for MT, but even for Search, and the many reasons to consider the data quality, yet again.&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/09/growing-interest-concern-about-future.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;The Growing Interest &amp;amp; Concern About the Future of Professional Translation&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; About reactions to the changes underway in translation&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/05/standards-importance-of-measurement.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;Standards: the Importance of Measurement&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; A guest post by Valeria Cannavina on how standards can drive quality improvements&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/12/moses-madness-and-dead-flowers.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;The Moses Madness and Dead Flowers&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; A post that questions some of the assumptions made by “instant Moses” advocates and challenges the long-term value of these experiments. Strong opinions voiced in the comments.&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/08/translation-crowdsourcing.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;Translation Crowdsourcing&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; An exploration of the driving forces underlying successful translation crowdsourcing efforts.&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;li&gt;     &lt;h5&gt;









&lt;a href="http://kv-emptypages.blogspot.com/2011/02/exploration-of-post-editing-mt-part-i.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;An Exploration of Post-Editing MT – Part I&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small; font-weight: normal;"&gt; Discussion on the nature and compensation of post-editing MT work.&lt;/span&gt;&lt;/h5&gt;
&lt;/li&gt;
&lt;/ol&gt;
&lt;h5&gt;









&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;&lt;/span&gt;&lt;/h5&gt;
&lt;div style="text-align: center;"&gt;
&lt;b&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;span style="font-size: large;"&gt;&lt;i&gt;Please Repeat:&amp;nbsp;Influence is NOT Popularity&lt;/i&gt;!&amp;nbsp;&lt;/span&gt; --&amp;nbsp; &lt;/span&gt;&lt;i style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;b&gt;Brian Solis&lt;/b&gt;&lt;/i&gt;&lt;/b&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;&lt;b&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt; &lt;/span&gt;&lt;/b&gt;&lt;/span&gt;&lt;/div&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;While reader traffic is one way to measure the impact of articles, there are also other ways that capture the relative influence of individual posts.&lt;a href="http://www.postrank.com/"&gt; PostRank&lt;/a&gt; is one such measure that I think monitors how others reference the posts, and monitors where and when content generates meaningful interactions across the web. They provide a truer picture of the relative influence and impact of individual blog posts, and thus I include the latest PostRank snapshot here. (&lt;i&gt;You can link to the posts through the table on the right of this blog text).&amp;nbsp; &lt;/i&gt;This table shows that some articles that may not have had high direct readership may actually be much more useful to readers and it is interesting to see how different the two lists are though it is clear that the analysis of the Google Translate API shutdown/pay-wall was a major hit no matter how you look at it.&amp;nbsp; &lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;a href="http://lh3.ggpht.com/-mXVKcijjmvo/Tv0ERC-lBnI/AAAAAAAAATo/hmcihplajvQ/s1600-h/image%25255B2%25255D.png"&gt;&lt;span style="font-family: Trebuchet MS;"&gt;&lt;img alt="image" border="0" height="244" src="http://lh3.ggpht.com/-fcuiUT3XnUM/Tv0ERdtw1YI/AAAAAAAAATw/0kXU5LxJXos/image_thumb.png?imgmax=800" style="background-image: none; border-bottom: 0px; border-left: 0px; border-right: 0px; border-top: 0px; display: block; float: none; margin-left: auto; margin-right: auto; padding-left: 0px; padding-right: 0px; padding-top: 0px;" title="image" width="153" /&gt;&lt;/span&gt;&lt;/a&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;It is also interesting to note that some older posts continue to strike a chord with readers and remain active in terms of visibility because the themes are longer lived and also perhaps because they ring true. The &lt;/span&gt;&lt;a href="http://kv-emptypages.blogspot.com/2010/05/are-there-any-standards-in-translation.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;original post on standards&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt; and some of the posts &lt;/span&gt;&lt;a href="http://kv-emptypages.blogspot.com/2010/04/falling-translation-prices-and.html"&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;discussing disintermediation&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt; were also posts that generate continuing interest and continue to show up in both the Google Analytics and PostRank ratings.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;I have noticed that we are getting more clarity on post-editing MT work in many different ways including new models for more equitable compensation. I am hoping to highlight best practices in this area in the coming year as I believe it will be critical to ongoing adoption and success with MT technology. I also think there will be much more to share on best practices of post-editing MT and I expect that we may find that it is not quite the dreaded beast it has often been portrayed to be.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;blockquote class="tr_bq"&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Social Media is not just a set of new channels for marketing messages. 
It’s an opportunity for organizations to align with the marketplace and 
start delivering on behalf of customers&amp;nbsp; &lt;i&gt;&lt;b&gt;-- Valeria Maltoni, conversationagent.com&lt;/b&gt;&lt;/i&gt;&lt;/b&gt;&lt;/div&gt;
&lt;/blockquote&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;I would also like to invite some of you to contribute to the discussion in this blog (guest posts) and assure you that I believe in open discourse and think it is useful for many different viewpoints to be aired to get closer to the “truth”. So please don’t hesitate to send me contributions that you think might be interesting to the audience that has been following this blog. I thank you for your support and I hope that the content here will continue to earn your interest and comments to extend the discussion beyond my thoughts on key issues.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;For those who are not aware, there are some very interesting videos from presentations at TAUS that I reported on in the 4th ranked posting above on PEMT momentum. &amp;nbsp;&amp;nbsp;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;!--[if gte mso 9]&gt;&lt;xml&gt;
 &lt;o:OfficeDocumentSettings&gt;
  &lt;o:AllowPNG/&gt;
 &lt;/o:OfficeDocumentSettings&gt;
&lt;/xml&gt;&lt;![endif]--&gt;&lt;!--[if gte mso 9]&gt;&lt;xml&gt;
 &lt;w:WordDocument&gt;
  &lt;w:View&gt;Normal&lt;/w:View&gt;
  &lt;w:Zoom&gt;0&lt;/w:Zoom&gt;
  &lt;w:TrackMoves/&gt;
  &lt;w:TrackFormatting/&gt;
  &lt;w:PunctuationKerning/&gt;
  &lt;w:ValidateAgainstSchemas/&gt;
  &lt;w:SaveIfXMLInvalid&gt;false&lt;/w:SaveIfXMLInvalid&gt;
  &lt;w:IgnoreMixedContent&gt;false&lt;/w:IgnoreMixedContent&gt;
  &lt;w:AlwaysShowPlaceholderText&gt;false&lt;/w:AlwaysShowPlaceholderText&gt;
  &lt;w:DoNotPromoteQF/&gt;
  &lt;w:LidThemeOther&gt;EN-US&lt;/w:LidThemeOther&gt;
  &lt;w:LidThemeAsian&gt;X-NONE&lt;/w:LidThemeAsian&gt;
  &lt;w:LidThemeComplexScript&gt;HI&lt;/w:LidThemeComplexScript&gt;
  &lt;w:Compatibility&gt;
   &lt;w:BreakWrappedTables/&gt;
   &lt;w:SnapToGridInCell/&gt;
   &lt;w:WrapTextWithPunct/&gt;
   &lt;w:UseAsianBreakRules/&gt;
   &lt;w:DontGrowAutofit/&gt;
   &lt;w:SplitPgBreakAndParaMark/&gt;
   &lt;w:EnableOpenTypeKerning/&gt;
   &lt;w:DontFlipMirrorIndents/&gt;
   &lt;w:OverrideTableStyleHps/&gt;
  &lt;/w:Compatibility&gt;
  &lt;m:mathPr&gt;
   &lt;m:mathFont m:val="Cambria Math"/&gt;
   &lt;m:brkBin m:val="before"/&gt;
   &lt;m:brkBinSub m:val="&amp;#45;-"/&gt;
   &lt;m:smallFrac m:val="off"/&gt;
   &lt;m:dispDef/&gt;
   &lt;m:lMargin m:val="0"/&gt;
   &lt;m:rMargin m:val="0"/&gt;
   &lt;m:defJc m:val="centerGroup"/&gt;
   &lt;m:wrapIndent m:val="1440"/&gt;
   &lt;m:intLim m:val="subSup"/&gt;
   &lt;m:naryLim m:val="undOvr"/&gt;
  &lt;/m:mathPr&gt;&lt;/w:WordDocument&gt;
&lt;/xml&gt;&lt;![endif]--&gt;&lt;!--[if gte mso 9]&gt;&lt;xml&gt;
 &lt;w:LatentStyles DefLockedState="false" DefUnhideWhenUsed="true"
  DefSemiHidden="true" DefQFormat="false" DefPriority="99"
  LatentStyleCount="267"&gt;
  &lt;w:LsdException Locked="false" Priority="0" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Normal"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="heading 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 7"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 8"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 9"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 7"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 8"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 9"/&gt;
  &lt;w:LsdException Locked="false" Priority="35" QFormat="true" Name="caption"/&gt;
  &lt;w:LsdException Locked="false" Priority="10" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Title"/&gt;
  &lt;w:LsdException Locked="false" Priority="1" Name="Default Paragraph Font"/&gt;
  &lt;w:LsdException Locked="false" Priority="11" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Subtitle"/&gt;
  &lt;w:LsdException Locked="false" Priority="22" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Strong"/&gt;
  &lt;w:LsdException Locked="false" Priority="20" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Emphasis"/&gt;
  &lt;w:LsdException Locked="false" Priority="59" SemiHidden="false"
   UnhideWhenUsed="false" Name="Table Grid"/&gt;
  &lt;w:LsdException Locked="false" UnhideWhenUsed="false" Name="Placeholder Text"/&gt;
  &lt;w:LsdException Locked="false" Priority="1" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="No Spacing"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" UnhideWhenUsed="false" Name="Revision"/&gt;
  &lt;w:LsdException Locked="false" Priority="34" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="List Paragraph"/&gt;
  &lt;w:LsdException Locked="false" Priority="29" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Quote"/&gt;
  &lt;w:LsdException Locked="false" Priority="30" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Intense Quote"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="19" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Subtle Emphasis"/&gt;
  &lt;w:LsdException Locked="false" Priority="21" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Intense Emphasis"/&gt;
  &lt;w:LsdException Locked="false" Priority="31" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Subtle Reference"/&gt;
  &lt;w:LsdException Locked="false" Priority="32" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Intense Reference"/&gt;
  &lt;w:LsdException Locked="false" Priority="33" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Book Title"/&gt;
  &lt;w:LsdException Locked="false" Priority="37" Name="Bibliography"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" QFormat="true" Name="TOC Heading"/&gt;
 &lt;/w:LatentStyles&gt;
&lt;/xml&gt;&lt;![endif]--&gt;&lt;!--[if gte mso 10]&gt;
&lt;style&gt;
 /* Style Definitions */
 table.MsoNormalTable
 {mso-style-name:"Table Normal";
 mso-tstyle-rowband-size:0;
 mso-tstyle-colband-size:0;
 mso-style-noshow:yes;
 mso-style-priority:99;
 mso-style-parent:"";
 mso-padding-alt:0in 5.4pt 0in 5.4pt;
 mso-para-margin:0in;
 mso-para-margin-bottom:.0001pt;
 mso-pagination:widow-orphan;
 font-size:11.0pt;
 mso-bidi-font-size:10.0pt;
 font-family:"Calibri","sans-serif";
 mso-ascii-font-family:Calibri;
 mso-ascii-theme-font:minor-latin;
 mso-hansi-font-family:Calibri;
 mso-hansi-theme-font:minor-latin;
 mso-bidi-font-family:Mangal;
 mso-bidi-theme-font:minor-bidi;}
&lt;/style&gt;
&lt;![endif]--&gt;

&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; line-height: 11.25pt;"&gt;
&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;Videos of presentations and panels at the
recent TAUS User Conference in Santa Clara are now available on YouTube for
everyone. The links below will take you to playlists on specific themes:&amp;nbsp;&lt;/span&gt;&lt;span style="font-size: 10pt;"&gt;&lt;/span&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: left;"&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PL4B167B80018A01C5" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;The
multilingual web – “beyond the translate button”&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PL859FAD1ED8341AA9&amp;amp;feature=viewall" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;Open Translation Platforms&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PL163F2AC22467C301&amp;amp;feature=viewall" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;TAUS members share Moses-related tools, making others’ lives
easier&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PLAAD4375300672AC5&amp;amp;feature=viewall" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;The Great Interoperability Debate&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PLC8325A67E789E015&amp;amp;feature=viewall" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;Machine Translation Use Cases&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PL0B4C900CEEDB739F&amp;amp;feature=edit_ok" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;R/time Multilingual Chat and Spoken Translation&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PL3115D8C111A99754&amp;amp;feature=viewall" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;Researchers on Future Translation Technologies&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="background: none repeat scroll 0% 0% rgb(247, 247, 247); color: #676767; font-size: 10pt;"&gt;&lt;a href="http://www.youtube.com/playlist?list=PL46934396EAC94241&amp;amp;feature=viewall" style="border-color: initial; border-style: initial;" target="_blank"&gt;&lt;span style="border: none windowtext 1.0pt; color: #676767; mso-border-alt: none windowtext 0in; padding: 0in;"&gt;Collaborative Translation and Innovating Pricing&lt;/span&gt;&lt;/a&gt;&lt;/span&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS; font-size: small;"&gt;I wish you all a wonderful holiday season and look forward to sharing observations in the coming year, a year that many say will be a turning point across many dimensions.&lt;/span&gt;&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-1503896305335051575?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/ORXqmG9kdWjtjh4pAdVO-KFrAo8/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/ORXqmG9kdWjtjh4pAdVO-KFrAo8/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/ORXqmG9kdWjtjh4pAdVO-KFrAo8/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/ORXqmG9kdWjtjh4pAdVO-KFrAo8/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=tZ68YoR0XUw:7cm0lNeuFAQ:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=tZ68YoR0XUw:7cm0lNeuFAQ:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=tZ68YoR0XUw:7cm0lNeuFAQ:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=tZ68YoR0XUw:7cm0lNeuFAQ:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/tZ68YoR0XUw" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/1503896305335051575/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/12/review-top-blog-posts-from-2011.html#comment-form" title="0 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/1503896305335051575?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/1503896305335051575?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/tZ68YoR0XUw/review-top-blog-posts-from-2011.html" title="Review: Most Popular Blog Posts from 2011" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://lh3.ggpht.com/-fcuiUT3XnUM/Tv0ERdtw1YI/AAAAAAAAATw/0kXU5LxJXos/s72-c/image_thumb.png?imgmax=800" height="72" width="72" /><thr:total>0</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/12/review-top-blog-posts-from-2011.html</feedburner:origLink></entry><entry gd:etag="W/&quot;AkEGRHo_cSp7ImA9WhRVFEU.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-7715058610882400555</id><published>2011-12-02T01:48:00.001-08:00</published><updated>2012-01-13T13:03:45.449-08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-13T13:03:45.449-08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="Moses" /><category scheme="http://www.blogger.com/atom/ns#" term="SMT" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><title>The Moses Madness and Dead Flowers</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Machine translation technology has an unfortunate history of overpromising and under delivering. At least 50 years of doing this and sometimes it seems that the torture will never stop. MT enthusiasts continue to make promises that often greatly exceed the realistic possibilities. Recently, in various conversations, I have seen that the level of unwarranted exuberance around the possibilities with the Moses Open Source SMT technology is rising to peak levels. This is especially true in the LSP community. &lt;b&gt;While most technologies go through a single hype cycle, MT seems destined to go through several of these cycles with each new approach and the latest of these is what I call Moses Madness.&lt;/b&gt; It has become fashionable of late to build instant DIY MT engines, using tools that help you with the mechanics of running the &lt;/span&gt;&lt;a href="http://en.wikipedia.org/wiki/Moses_%28machine_translation%29"&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;software that is “Moses”&lt;/span&gt;.&lt;/a&gt;&lt;span style="font-family: Trebuchet MS;"&gt;&amp;nbsp; &lt;b&gt;While some of these tools greatly simplify the mechanical process of running the Moses software, they do not give you any insight into what is really going on inside the magic box&lt;/b&gt; or any clues to what you are doing at all.&amp;nbsp; Moses is a wonderful technology and it enables all kinds of experimentation that furthers the art and science of data-driven MT, but it does require some knowledge and understanding for real success. It is possible to get a quick and dirty MT engine together using some of these tools, but for long-term strategic translation production leverage, I am not so sure. Thus it is my sense that we are at the peak of the &lt;a href="http://en.wikipedia.org/wiki/Hype_cycle"&gt;hype cycle&lt;/a&gt; for DIY Moses. &lt;/span&gt;&lt;br /&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://1.bp.blogspot.com/-zSo5BWZKo2w/TulvNvHrAlI/AAAAAAAAATc/b4tUNitUMmQ/s1600/MosesMadness.png" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" height="240" src="http://1.bp.blogspot.com/-zSo5BWZKo2w/TulvNvHrAlI/AAAAAAAAATc/b4tUNitUMmQ/s320/MosesMadness.png" width="320" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;div align="center"&gt;
&lt;/div&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;I would like to present a somewhat contrarian viewpoint to much of what you will hear at TAUS - &lt;a href="http://www.translationautomation.com/best-practices/let-a-thousand-mt-systems-bloom.html"&gt;“Let a thousand MT systems bloom”&lt;/a&gt;,&amp;nbsp; and other online forums on getting started with instant MT approaches&lt;/b&gt;.&amp;nbsp; IMO Moses and especially instant Moses is clearly not the final answer. While Moses is a starting point for real development, it should not be mistaken as the final destination. I think there are a number of reasons that you should pause before you jump in, and at least build up some knowledge before taking the dive. I have attempted to enumerate some of these reasons, but I am sure some will disagree. Anyway, I hope an open discussion will be valuable in reaching a more sustainable and accurate view of the reality and so here goes, even though perhaps I am rushing in where angels fear to tread.&amp;nbsp; And of course my opinion on this matter is not impartial, given my involvement with Asia Online. &lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;b&gt;&lt;span style="font-family: Trebuchet MS; font-size: medium;"&gt;The Sheer Complexity&lt;/span&gt;&lt;/b&gt;&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;As you can see from &lt;a href="http://www.statmt.org/moses/?n=Moses.GetInvolved"&gt;the official description&lt;/a&gt;, Moses is an open source project that makes its home in the academic research community. &lt;a href="http://www.statmt.org/moses/?n=Moses.GetInvolved"&gt;This link describes some of the conferences&lt;/a&gt; where people with some expertise and understanding of what Moses &lt;b&gt;actually does&lt;/b&gt; convene and share information. Take a look at the program committee of these conferences to get a sense of what the focus might be.&lt;b&gt; Now take a look at the &lt;/b&gt;&lt;a href="http://www.statmt.org/moses_steps.html"&gt;&lt;b&gt;“ step-by-step guide”,&lt;/b&gt;&lt;/a&gt;&lt;b&gt; which students in NLP are expected to be able to handle. It is what you would have to do to build an MT system if did not have the DIY kit.&amp;nbsp; Most of the instant/simplified Moses engine services in the market focus on simplifying this &lt;u&gt;and only this&lt;/u&gt; aspect of developing an MT engine&lt;/b&gt;.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Clearly it would be good to have some knowledge of what is going on in the magic box BEFORE you begin, and perhaps it would even be really nice to have some limited team expertise with computational linguistics to make your exploration more useful. &lt;b&gt;Remember that hiding complexity is not quite the same as removing complexity, and it would be smart to not underestimate this complexity BEFORE you begin.&lt;/b&gt; Anybody who has ventured into this has probably realized already, that while some of the complexity has been hidden, there is still much that is ugly and complicated to deal with in Moses world, and often it feels like the blind leading the blind.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;I have noticed that many in professional translation industry have trouble even with basics like MT system BLEU scoring, and even some alleged MT experts barely know how to measure BLEU accurately and fairly. Thus I am skeptical that LSPs will be able to jump into this with any real level of competence in the short term. A level of competence that assures or at least raises the probability of business success i.e. enhances long-term translation productivity. Though it is possible that a hardy few will learn over the next 2-5 years, it is also clear that NLP and computational linguistics is not for everyone. The level and extent of knowledge required is simply too specialized and vast. As Richard Feynman said:”I think it’s much more interesting to live not knowing, than to have answers which might be wrong.” (&lt;i&gt;Though he was talking about beauty, curiosity &lt;/i&gt;&lt;a href="http://www.npr.org/blogs/krulwich/2011/11/25/142702452/after-ohio-state-clobbers-michigan-cuddle-up-with-professor-feynman?ft=1&amp;amp;f=5500502"&gt;&lt;i&gt;and mostly about doubt).&lt;/i&gt;&lt;/a&gt;&lt;i&gt;&amp;nbsp;&lt;/i&gt;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;a href="http://www.linkedin.com/profile/view?id=2846244&amp;amp;authType=name&amp;amp;authToken=KJxS&amp;amp;goback=.gmp_2866905&amp;amp;trk=anet_mfeed_profile"&gt;Alon Lavie&lt;/a&gt;, AMTA President, CMU NLP professor and President of Safaba &lt;i&gt;(which develops hosted MT solutions that are largely built on top of Moses)&lt;/i&gt; says:&lt;/span&gt; &lt;br /&gt;
“ I am of course a strong supporter, and am extremely enthusiastic about Moses and what it has accomplished in both academic research and in the commercial space. I also think there is indeed a lot of value in the various DIY offerings (commercial and Achim's M4L efforts). But these efforts primarily target and solve the&lt;b&gt; *engineering complexity*&lt;/b&gt; of deploying Moses. While this undoubtedly is a critical bottleneck, I think there is a potential pitfall here that users that are not MT experts (the vast majority) would come to believe that that's all it takes to build a state-of-the-art MT system. The technology is actually complex and is getting more complex and involved to master. &lt;b&gt;Users may be disappointed with what they get from DIY Moses, and more detrimentally, become convinced that that's the best they can accomplish, when in fact letting expert MT developers do the work can result in far better performance results.&lt;/b&gt; I think this is an important message to communicate to potential users, but I'm not sure how best to communicate this message.”&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Thus, I will join Alon in trying to convey the message that Moses is a starting point in your exploration of MT and not the final answer, and that experience, expertise and knowledge matter. Perhaps, a way to understand the complexity issue better, is to use some analogies.&amp;nbsp; &lt;/span&gt;&lt;br /&gt;
&lt;a href="http://lh5.ggpht.com/-8HD8mqR_Low/Ttie7qrWH8I/AAAAAAAAAS0/UmonHFTmAsE/s1600-h/image6.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh5.ggpht.com/-xD6LAfbxfsY/Ttie74rdVwI/AAAAAAAAAS8/jxjabEKJHZA/image_thumb2.png?imgmax=800" style="background-image: none; border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto; padding-left: 0px; padding-right: 0px; padding-top: 0px;" title="image" width="244" /&gt;&lt;/a&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;The sewing machine/tailor analogy&lt;/b&gt;: Moses can be perhaps be viewed as a very basic sewing machine. You still need to understand how to cut cloth, stitching technique, fabric and lining selection, measurement, pocket technique (?), final fit modifications and so on to make clothes. Tailors do it better and expert tailors that only focus on men's suits do it even better than you or I would with the same sewing equipment. The closest to a ready made suit would be the free MT engines, except in this analogy they are only available in one size. Expertise really does matter folks if you want to customize-to-fit.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;The DIY car analogy:&lt;/b&gt; In this analogy, Moses is the car engine and perhaps a very basic chassis, one that would be dangerous on a highway or bumpy roads. The DIY task is to build a car that can actually be used as transportation. This will require some understanding of auto systems design, matching key components to each other, tires, braking systems, body design and so on. Finally you also need to learn to drive and you would want the car to turn right when you want to. Again, expert mechanics are more likely to be successful even though there are some great DIY kits out there for NASCAR enthusiasts.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;b&gt;&lt;span style="font-family: Trebuchet MS; font-size: medium;"&gt;The Learning Curve&lt;/span&gt;&lt;/b&gt;&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Even if you do have a team with some NLP expertise, remember that working with any complex technology involves a process of learning and usually an apprenticeship to get to a point of real skill. &lt;b&gt;The people who build SMT engines at Microsoft, Google, Asia Online and other MT research teams have built thousands of MT engines during their MT careers. The skills developed and lessons learned during this experience are not easily replicated and embedded into open source code. Failure is often the best teacher and most of these teams have failed often enough to understand the many pitfalls along an SMT engine development path. &lt;/b&gt;To expect that any “instant” Moses solution is going to capture and encapsulate all of this is naïve and and somewhat arrogant.&lt;b&gt; This is the kind of skill where expertise builds slowly, and comes after much experimentation across many different kinds of data and use case scenarios&lt;/b&gt;. Just as professional tailors and expert mechanics are likely to produce better results, MT experts who work across many different use scenarios are likely to produce much better results than a do-it-yourself enthusiast might. These results translate into long-term savings that should far exceed an initially higher price.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;The objective of MT deployment for most LSP users is to increase translation productivity. (Very few have reached the next phase where they are translating new content that would never be translated were it not for MT). Thus getting the best possible systems that produce the highest possible MT output quality really matters to achieve this core objective of achieving measurable translation productivity. To put this in simpler terms, the difference between instant Moses systems and expert MT systems could be as much as 4,000 words/day versus 10,000+ words a day. &lt;b&gt;Expert MT engine developers like Asia Online have multi-dimensional approaches, NLP skills, and many specialized tools in place to extract the maximum amount of information out of the data they have available. The use of these tools is &lt;/b&gt;&lt;a href="http://amta2010.amtaweb.org/cfp-tutorials_accepted_T5.html"&gt;&lt;b&gt;guided by two team members&lt;/b&gt;&lt;/a&gt;&lt;b&gt; with deep expertise on the inner workings of Moses and SMT in general&lt;/b&gt;. The learning process driving the development of these comprehensive tools takes years, and they enable Asia Online custom systems to produce superior translation output to the free online MT engines consistently. One team member has literally &lt;a href="http://homepages.inf.ed.ac.uk/pkoehn/"&gt;written the book on SMT&lt;/a&gt; and created Moses and thus one could presume is quite likely to have the expertise to develop better MT systems than most.&amp;nbsp;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;I have already heard from several translators who when asked to post-edit “instant Moses” output they know is inferior, simply run the same source material through Google/Bing and edit that instead, to improve their own personal productivity and save themselves some anguish&lt;/b&gt;. So if your Moses engine is not as good as these public engines you will find that translators will simply bypass them whenever they can. And they may not actually tell you that they are doing this. Post-editors will generally choose the best MT output they can get access to, so beware if your engine does not compare well. And buyers, insist on seeing how these instant MT engines compare to the public free engines on a meaningful and comprehensive test set, not just a 100 or so sentences.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;However, I am also aware that some Moses initiatives have produced great results &lt;a href="http://translate.autodesk.com/productivity.html"&gt;e.g. Autodesk&lt;/a&gt;,(&lt;i&gt;for you doubters on the value of PEMT, here is clear evidence from a customer viewpoint)&lt;/i&gt; and here I would caution against any extrapolation of these results and expectation to achieve this for any and every Moses attempt. The team that produced these systems were more technically capable and knowledgeable than most, and I am also aware that that their training data was better suited for SMT than most of the TM you will find in the TDA or on the web. And even here, I would argue that MT experts would probably produce better results with the same data especially with the Asian languages where other support tools and processes become much more imperative.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;As others have stated before me, the global population of people who actually understand how these data-driven systems work is really quite tiny, miniscule in fact&lt;/b&gt;. &lt;b&gt;If you are building Moses systems you should be comparing yourself to the public free engines, as you may find that all your effort was much ado about nothing&lt;/b&gt;. &lt;b&gt;One would hope that you will produce systems that compare favorably to these “free” options&lt;/b&gt;. And if your competition includes the lads and lassies at Microsoft and Google, one would hope that you know more about how to do this than pushing the instant Make-my-engine button. The financial cost of ignorance is substantially higher than most are able to define in terms of lost opportunity costs, and learning costs (a.k.a. mistakes) should be factored into a real TCO (Total Cost of Ownership).&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;The bottom line: Success with SMT requires very specialized skills that include, some NLP background, massive data handling skills, knowledge of parallel computing processing, linguistic data management tools, corpus analysis and linguistic structural analysis capabilities for optimal results not to mention a culture that nurtures collaboration with translators.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;b&gt;&lt;span style="font-family: Trebuchet MS; font-size: medium;"&gt;The Data, the Data, The Data&lt;/span&gt;&lt;/b&gt;&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Moses is a data-driven technology and thus is highly dependent on the data that is used. Data volume is required to get good output from the systems and thus users have to gather the data from public sources and it is important to normalize and prepare the data for optimal performance. Most LSPs will not have the data or skills needed to gather the data in an optimal way.&lt;b&gt; I have seen two major SMT engineering initiatives up close, one where training data was scraped off the web by spider programs, and another where data was not allowed to go into training data if it had not passed several human linguistic quality assessment checks. The differing impact of these approaches is quite striking.&lt;/b&gt; &lt;b&gt;The dirty data approach requires substantially larger amounts of new data to see any ongoing improvement, while the clean data approach can produce compelling improvement results with much less new data.&lt;/b&gt;&amp;nbsp;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt; This ability to respond to small amounts of corrective feedback is a critical condition for ongoing improvement, and for continued improvements in productivity e.g. raising PEMT throughput up to 15,000+ words/day in the shortest time possible. &lt;a href="http://kv-emptypages.blogspot.com/2011/10/building-momentum-for-post-edited.html"&gt;I have already stated&lt;/a&gt; that I was surprised how little attention is paid to data quality in instant Moses approaches presented at TAUS&lt;b&gt;.&lt;/b&gt; And while data volume matters, for high quality domain-focused systems, the data you exclude may be more important than what you include. We are in a phase of the web's development where ‘ Big Data” is solving many semantic and linguistic problems, but we have also seen that &lt;a href="http://kv-emptypages.blogspot.com/2011/01/end-of-road-for-more-data-better.html"&gt;data is not always the solution to better MT systems.&lt;/a&gt;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;The upfront data analysis and data preparation, the development of “good” tuning and test sets are critical to the the short and long-term quality and evolution of an MT engine. This is something that takes experience and experimentation to understand and be skillful at. Experts can add huge value at this formative stage. Remember that this is a technology where “Garbage In Garbage Out” (GIGO) will be particularly true. Many who understand how bad TM can get don’t need any further elaboration on this, even though some people in the SMT community remain unconvinced that clean data does matter.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;Many of the people who have jumped into instant Moses, do not realize that to get your initial MT engine to improve, will require very large amounts of new data with a standard Moses approach. The rule of thumb I have heard used frequently is that you need 20-25% of the initial training data volume to see meaningful improvements&lt;/b&gt;. &lt;b&gt;Thus, if you used 10 million words to build your system, you will need 2-3 million new words to see the system noticeably improve. So most of these instant systems are as good as they are ever going to get when the first engine is produced.&lt;/b&gt; In contrast, Asia Online systems can improve dramatically with as little as a few thousand sentences (a single project) and are architected and designed from the outset to improve continuously over time with focused and targeted corrective feedback.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Given the difficulty of getting large amounts of new data, users need systems that can respond to small amounts of corrective feedback and yet show noticeable improvements. One of the major deficiencies of historical MT systems has been the lack of user control, the inability of users to make any meaningful impact on the quality of raw output produced on an ongoing basis.&lt;b&gt;This ability to C&lt;u&gt;ONTINUALLY&lt;/u&gt; steer the MT engine with financially feasible amounts (&lt;/b&gt;i.e. relatively small&lt;b&gt;) of corrective feedback is a key to getting the best long-term productivity results and ROI. I think as users get more informed on how to work with this technology, they will zero in on this ability of some expert MT systems. IMO, it is the single most important criterion when evaluating competitive MT systems: &lt;/b&gt;&lt;/span&gt;&lt;br /&gt;
&lt;ul&gt;
&lt;li&gt;&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;What do I have to do to improve the raw system output quality once an initial engine is in place? &lt;/b&gt;&lt;/span&gt;&lt;/li&gt;
&lt;li&gt;&lt;span style="font-family: Trebuchet MS;"&gt;&lt;b&gt;And, how much effort/data is required to get meaningful and measurable improvements?&lt;/b&gt;&lt;/span&gt; &lt;/li&gt;
&lt;li&gt;&lt;b&gt;&lt;span style="font-family: Trebuchet MS;"&gt;Measurable = Rising average throughput of post-editors &lt;/span&gt;&lt;/b&gt;&lt;span style="font-family: Trebuchet MS;"&gt;(By hundreds or thousands of more words a day, and often a multiple of what is possible with instant MT)&lt;/span&gt;&lt;b&gt;&lt;span style="font-family: Trebuchet MS;"&gt;.&lt;/span&gt;&lt;/b&gt;&lt;/li&gt;
&lt;/ul&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;The issue of data cleaning is also not well understood. While it is helpful to remove tags and formatting information, it is also important to validate the linguistics and the quality of translations in addition to this to avoid GIGO results. Users should take care to keep data in the cleanest possible state (format wise and linguistically) as it can provide real long-term business production leverage on a scale greater than most TM data can. What most successful users will find is that 90%+ of the time spent in developing the highest quality engines is spent in corpus and data analysis, data preparation and organization, error detection and correction. The Moses step is a tiny component of the whole process of developing superior MT engines.&lt;/span&gt;&amp;nbsp;&lt;a href="http://lh5.ggpht.com/-1smW2zUCXtw/Ttie8RJjfZI/AAAAAAAAATE/8H4SbfoLxas/s1600-h/image3.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh5.ggpht.com/-c-pUFasP4co/Ttie84QheXI/AAAAAAAAATI/xgab2RkYZUg/image_thumb1.png?imgmax=800" style="background-image: none; border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto; padding-left: 0px; padding-right: 0px; padding-top: 0px;" title="image" width="244" /&gt;&lt;/a&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;b&gt;&lt;span style="font-family: Trebuchet MS; font-size: medium;"&gt;Control &amp;amp; Data Security&lt;/span&gt;&lt;/b&gt;&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;One of the reasons why it may make sense to use Moses sometimes is to keep your data and training and translation activity REALLY REALLY private &lt;i&gt;(e.g. translations of interrogation transcripts where persuasion involving water might be used).&lt;/i&gt; The need for security and privacy especially makes sense for national security applications, but I find it hard to understand the resistance some global companies have, to working in the cloud when a lot of this MT and PEMT content ends up on the web anyway. &lt;b&gt;For most companies cloud computing simply makes sense and spares the user from the substantial IT burden of maintaining the hardware infrastructure needed to play at the highest professional level.&lt;/b&gt; &lt;i&gt;(Asia Online actually makes it’s full training and translation environment available for on-premise installation for large enterprise customers like LexisNexis who process hundreds of millions of words a day and have suitable computing and human resource expertise to handle this&lt;/i&gt;).&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;I have heard of several LSPs who have spent $10K–$20K on servers that will probably only do Moses training once a year.&lt;b&gt; If you do not have the data to drive an improvement in your Moses engine, what is the point of having these kinds of servers?&amp;nbsp; There is no point in trying to re-train an engine when you don’t have enough new data to make any noticeable impact.&lt;/b&gt; This is a technology that just makes much more sense in the cloud, for scalability, extensibility, security and effective control. Cloud solutions are often more secure than on-premise installations at LSPs because cloud service providers can afford the IT staff that has deep expertise on computer security, data protection and data availability management. &lt;i&gt;(BTW I have also seen what happens when hacks try and manage 200 servers = not pretty&lt;/i&gt;). Like many other things in today’s world, IT (Information Technology) has become so specialized and complex that it makes more sense to outsource much of it, and work in the cloud rather than try and do it on your own with a meager and barely trained staff. Compare your IT &lt;a href="http://www.rackspace.com/managed_hosting/"&gt;staff capabilities&lt;/a&gt; to &lt;a href="http://www.voxel.net/managed-hosting"&gt;any cloud service&lt;/a&gt; provider. Even Microsoft Office is finally &lt;a href="http://office.microsoft.com/en-us/web-apps/"&gt;making the transition&lt;/a&gt; to the cloud. Some analysts are even saying that &lt;a href="http://bits.blogs.nytimes.com/2011/12/01/cloud-computing-endangers-older-tech-companies/?partner=rss&amp;amp;emc=rss"&gt;the shift to the cloud will challenge the dominance &lt;/a&gt;of older stalwarts like HP,&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt; &lt;/span&gt;&lt;/span&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;Microsoft, Intel, SAP, RIM, Oracle, Cisco, Dell&amp;nbsp; &lt;/span&gt;&lt;span style="font-family: Trebuchet MS;"&gt;and that a third of these companies may not be around in in 2020. Remember DEC and Wang? &lt;b&gt;In a world where tablets, smartphones and mobile platforms will increasingly drive global commerce, the desktop/server perspective of traditional IT is already fading, and makes less sense with each passing day. It is ironic to see LSPs jumping on the “On-Premise Server” train just as it about to reach the end of the line.&lt;/b&gt;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;Cloud based MT can also be setup to be always improving (assuming you have more than basic Moses MT) as new data is added regularly and feedback gathered from users as Google and Bing do. Setting up this kind of infrastructure is a significant undertaking and most Moses users will never get to that point, but this is how the best MT systems will continue to evolve. What some may find is, that their domain focused MT system may be better than the public engines in January, but by June this may no longer be true. You should realize that you are dealing with a moving target and most public engines will continue to improve. All the expert MT developers are constantly updating and enhancing their technology, most have already moved beyond the phrase-based SMT that Moses is today, and are incorporating linguistics in various forms. This can only be done because they understand what they are doing. Some of these enhancements may make it back to Moses years later but the productivity edge will remain with experts in the foreseeable future and I expect in 2012 we will see several case studies where expert MT systems outperform instant Moses systems by significant margins. So my advice; Be wary of any kind of instant MT solution that is not free.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;I started the eMpTy Pages blog in early 2010, and one of my earliest posts was on &lt;/span&gt;&lt;a href="http://kv-emptypages.blogspot.com/2010/02/impact-of-clean-data-on-smt.html"&gt;&lt;span style="font-family: Trebuchet MS;"&gt;the importance of clean data&lt;/span&gt;&lt;/a&gt;&lt;span style="font-family: Trebuchet MS;"&gt; for SMT.&amp;nbsp; It was blasphemy at the time to question the value of sheer data volume for SMT, but in the period since then, many have validated that working with consolidated TM from multiple sources, trusted though they may be, is a tricky affair and data quality does matter. Pooling data can work sometimes but will also fail often without cleaning and standardization.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;The origin of the phrase &lt;a href="http://www.phrases.org.uk/meanings/226950.html"&gt;“Let a thousand flowers bloom”&lt;/a&gt; is attributed to a misquote of Mao Zedong. The results for Chinese intellectuals who took Mao seriously were &lt;a href="http://en.wikipedia.org/wiki/Hundred_Flowers_Campaign"&gt;quite unfortunate&lt;/a&gt;.&amp;nbsp; Fortunately we live in better times &lt;i&gt;(I think?)&lt;/i&gt; and this phrase is not likely to have such dire consequences today. However, while a thousand MT systems may bloom &lt;i&gt;(or at least be seeded),&lt;/i&gt; I predict that many will fade and die quickly. This is not necessarily bad, as hopefully institutional, community and industry learning will take place, and some practitioners may actually discover that they now have a much better appreciation for corpus linguistics and some of the skills that drive the creation of better MT systems. The experimental evidence from many failed experiments with Moses will also provide useful information for MT experts and further enhance the state of the art and science of MT. The learning curve for this technology is long and arduous and it may take a while for the dust to settle from the current hype, but I fully expect that by &lt;a href="http://en.wikipedia.org/wiki/2012_phenomenon"&gt;December 21st, 2012&lt;/a&gt; it will be clear that expertise, experience and knowledge does matter with something as complex as Moses. Dead flowers are also used to fertilize gardens and help other plants thrive, and as long as we have the long view, we will continue to move onward and upward. &lt;b&gt;I will restate my prediction, that the best MT systems will still come from close collaboration between MT experts with linguists, translators, LSPs and insight drawn from experience and failure.&amp;nbsp; &lt;/b&gt;&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;/span&gt;&lt;br /&gt;
&lt;div align="center"&gt;
&lt;span style="color: #c0504d; font-family: Trebuchet MS; font-size: small;"&gt;&lt;i&gt;And you can send me dead flowers every morning        &lt;br /&gt;Send me dead flowers by the mail         &lt;br /&gt;Send me dead flowers to my wedding         &lt;br /&gt;And I won't forget to put roses on your grave &lt;/i&gt;&lt;/span&gt;&lt;/div&gt;
&lt;span style="font-family: Trebuchet MS;"&gt;&lt;/span&gt;&lt;br /&gt;
&lt;div class="wlWriterEditableSmartContent" id="scid:5737277B-5D6D-4f48-ABFC-DD9C333F4C5D:927ec7b9-1989-4d50-92eb-4fd0e953f398" style="display: block; float: none; margin: 0px auto; padding-bottom: 0px; padding-left: 0px; padding-right: 0px; padding-top: 0px; width: 448px;"&gt;
&lt;div id="10dbab90-286f-4782-8a3b-b9be4801c944" style="display: inline; margin: 0px; padding: 0px;"&gt;
&lt;div&gt;
&lt;a href="http://www.youtube.com/watch?v=9-kjIfx1aQo" target="_new"&gt;&lt;img alt="" galleryimg="no" onload="var downlevelDiv = document.getElementById('10dbab90-286f-4782-8a3b-b9be4801c944'); downlevelDiv.innerHTML = &amp;quot;&amp;lt;div&amp;gt;&amp;lt;object width=\&amp;quot;448\&amp;quot; height=\&amp;quot;252\&amp;quot;&amp;gt;&amp;lt;param name=\&amp;quot;movie\&amp;quot; value=\&amp;quot;http://www.youtube.com/v/9-kjIfx1aQo?hl=en&amp;amp;hd=1\&amp;quot;&amp;gt;&amp;lt;\/param&amp;gt;&amp;lt;embed src=\&amp;quot;http://www.youtube.com/v/9-kjIfx1aQo?hl=en&amp;amp;hd=1\&amp;quot; type=\&amp;quot;application/x-shockwave-flash\&amp;quot; width=\&amp;quot;448\&amp;quot; height=\&amp;quot;252\&amp;quot;&amp;gt;&amp;lt;\/embed&amp;gt;&amp;lt;\/object&amp;gt;&amp;lt;\/div&amp;gt;&amp;quot;;" src="http://lh4.ggpht.com/-JIl4kyO5Sg0/Ttie9H1XFwI/AAAAAAAAATU/9piiaEsLQbs/video70357778348b%25255B75%25255D.jpg?imgmax=800" style="border-style: none;" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;/div&gt;
&lt;div style="clear: both; font-size: .8em; width: 448px;"&gt;
A celebration for dead flowers&lt;/div&gt;
&lt;/div&gt;
&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-7715058610882400555?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/AU6aH1NEYHjSwa3i-csUiScEsp4/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/AU6aH1NEYHjSwa3i-csUiScEsp4/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/AU6aH1NEYHjSwa3i-csUiScEsp4/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/AU6aH1NEYHjSwa3i-csUiScEsp4/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=PxGEUyxVwpo:QQknmpLhQ0s:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=PxGEUyxVwpo:QQknmpLhQ0s:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=PxGEUyxVwpo:QQknmpLhQ0s:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=PxGEUyxVwpo:QQknmpLhQ0s:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/PxGEUyxVwpo" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/7715058610882400555/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/12/moses-madness-and-dead-flowers.html#comment-form" title="26 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/7715058610882400555?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/7715058610882400555?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/PxGEUyxVwpo/moses-madness-and-dead-flowers.html" title="The Moses Madness and Dead Flowers" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://1.bp.blogspot.com/-zSo5BWZKo2w/TulvNvHrAlI/AAAAAAAAATc/b4tUNitUMmQ/s72-c/MosesMadness.png" height="72" width="72" /><thr:total>26</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/12/moses-madness-and-dead-flowers.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CU8DRXk_fyp7ImA9WhRRFko.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-1224203423238032128</id><published>2011-11-29T17:37:00.001-08:00</published><updated>2011-11-30T09:24:34.747-08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2011-11-30T09:24:34.747-08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="Post-editing" /><category scheme="http://www.blogger.com/atom/ns#" term="collaboration" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><title>Wanted: A Fair and Simple Compensation Scheme for MT Post-Editing</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;As the subject of fair and equitable compensation to post-editors of MT is important to the ongoing momentum of MT, I would like to introduce some people who have examined this issue, and have made an attempt (however imperfect) to developing a solution. The initial response to many such initiatives often seems to be criticism of how the approach fails. I am hoping that the dialogue on these ideas can rise above this, to more constructive and pragmatic advice or feedback to help the continuing evolution of this approach to reach more widely accepted levels of accuracy. The MemSource approach is something that measures the effort after the work is done. Used together with other initiatives that attempt to provide some measure of the post-editing task a priori, I think it could have great value in developing new compensation models that make sense to all the stakeholders in the professional translation world. It is important to develop new ways to measure MT quality and post-editing difficulty as this will become &lt;a href="http://www.freepressrelease.eu/?p=42044"&gt;increasingly more common&lt;/a&gt; in the professional translation world. &lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;This is&amp;nbsp; a guest post by David Canek, &lt;a href="http://www.memsource.com/about-us/"&gt;CEO of MemSource Technologies&lt;/a&gt;. I have not edited David’s article other than selecting some phrases that I felt were worth highlighting for a reader who skims the page.&lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;======================================&lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&amp;nbsp;&amp;nbsp; &lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Throughout 2011 &lt;a href="http://www.memsource.com/"&gt;MemSource&lt;/a&gt;, a provider of a cloud-based translation environment and CAT tool, has run a number of workshops, exploring the impact of machine translation on the traditional translation workflow. We had lots of debates with translation buyers, LSPs, as well as translators on machine translation post-editing and specifically on how it should be compensated. We have &lt;a href="http://blog.memsource.com/download-why-not-treat-mt-as-tm-memsource-case-study-presented-at-locworld/"&gt;shared our findings&lt;/a&gt; at the 2011 Localization World in Barcelona and we thought it may be interesting to also share them here, on the eMpTy Pages blog.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Translation Buyers and MT&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
While the majority of translation buyers still need to discover machine translation, there are many organizations whose progress with MT goes beyond the pilot phase. The innovators, among them many software companies, have successfully used machine translation to make the traditional translation process more efficient. One headache still remains: A simple and fair compensation scheme for machine translation post-editing. &lt;b&gt;Today, typically a flat reduction of the “normal” translation rate is negotiated with the vendor, disregarding the actual effort of the translator spent on post-editing a specific document, let alone a specific segment. This can be rather imprecise, even unfair as MT quality can vary significantly from document to document, and of course segment to segment.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Translators and MT&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;There is a myth that all translators dislike machine translation post-editing. In fact many translators have started MT post-editing as their standard translation workflow long before anyone requested them to do so.&lt;/b&gt; They themselves chose to use MT because it helped them increase their productivity. Then, some years later, they were approached by their LSP/client regarding MT. Perhaps it went like this?&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;Dear translator,&lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;We have introduced this great new technology, it is called machine translation. It will help you speed up your translation and – by the way we will cut your rates by 30%.&lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;i&gt;All the best...&lt;/i&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Of course, none of the translators could be happy at the face of this news. The innovative translators - already using MT to speed up their translations - would not be happy because nothing would change for them except that their rates would get cut. The less innovative also had no reason to be happy – they had to adapt to a new translation method and their rates got cut – without any guarantee that the new translation workflow would actually speed up their translation process.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;LSPs and MT&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Language service providers, generally speaking, are not too fast to adopt machine translation. This may come as a surprise, as LSPs should be most interested in slashing their costs with intelligent use of MT. However, LSPs, it seems, face specific obstacles, which make MT adoption not a simple task. In contrast to translation buyers, LSPs have to cope with limited resources, yet on the other hand have to tackle multiple language pairs and subject domains, spanning across all of their clients. Training a custom MT engine in this context is a bit challenging. The available online MT services, such as Google Translate or Microsoft Translator, are perceived by many LSPs as inadequate, mainly because of “confidentiality” concerns. The – growing – minority of LSPs that have started using custom MT engines report mixed results but are generally quite optimistic about the output.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Getting the right MT technology in place is important but not enough. LSPs need to make sure that there is ROI on the new technology. That means they need to modify their translation workflow to include machine translation and most of all have to make sure the new workflow makes translating faster, i.e. cheaper. This means that they will have to renegotiate rates with their translators. All of this is far from trivial and if not done carefully, it can cause more trouble than good.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Fair Compensation for MT Post-editing&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
MT is an innovative technology that will eventually (though not equally across all language pairs and domains) make human translation faster, i.e. cheaper. It is important that all stakeholders benefit from this increased efficiency: Translation buyers, LSPs and translators.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Above all, compensation for MT post-editing should be fair. There can be different ways. Some translation buyers run regular productivity tests and, based on the results, apply a flat discount on translations supported by MT (I believe Autodesk has a fairly sophisticated approach to this). At MemSource we have tried to come up with a different, perhaps complementary, approach, which is based on the editing distance between the MT output and the post-edited translation. Indeed, quite simple. We call this the &lt;b&gt;Post-editing Analysis&lt;/b&gt;. In fact this approach is an extension of the traditional “TRADOS discount scheme”, which long ago became a standard method for analyzing translation memory matches and the related discounts in the translation industry.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Post-editing Analysis: How It Works&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
When a translation for a segment can be retrieved from translation memory (a 100% match), the translation rate for that segment is reduced – typically to just 10% of the normal rate. A similar approach can be applied to MT post-editing. If the MT output for a segment is approved by the post-editor as correct, then we can say we have a 100% match and the post-editing rate should be very moderate for that segment. If, on the other hand, the post-editing effort is heavy and the machine translated output needs to be completely rewritten for a segment, a full translation rate should be paid. In the post-editing analysis, there is, of course an entire scale ranging from 0% to 100% when calculating the similarity (editing distance) between the MT output and its post-edited version. The rates can be adjusted accordingly.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;a href="http://lh6.ggpht.com/-h7ZQEPo5j3c/TtWI2zNhjiI/AAAAAAAAASM/XeeAAeZaMw4/s1600-h/clip_image002%25255B3%25255D.jpg"&gt;&lt;img alt="clip_image002" border="0" height="53" src="http://lh4.ggpht.com/-djNCCjEJqS0/TtWI25BTsdI/AAAAAAAAASU/gHbsGlEvHUE/clip_image002_thumb.jpg?imgmax=800" style="background-image: none; border-bottom: 0px; border-left: 0px; border-right: 0px; border-top: 0px; display: inline; padding-left: 0px; padding-right: 0px; padding-top: 0px;" title="clip_image002" width="244" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
The advantages of the post-editing analysis:&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
· Simple&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
· Transparent&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
· Measurable at segment-level&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
· Extension of the established TM discount scheme&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
There are also some disadvantages. Namely, the analysis can be run only after the post-editing has been carried out, which means that any discounts can be determined only after the translation job is completed. Another objection could be that the editing distance is a simplification of the actual effort of the post-editor. Indeed, this could be valid and a more complex approach could be applied. However, our goal was to come up with a simple and efficient approach, which could be easily implemented into today’s CAT workbenches and translation environments.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;Interested to Know More and Experiment&lt;/b&gt;&lt;b&gt;?&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
More details on the MemSource Post-editing analysis, incl. a &lt;a href="http://wiki.memsource.com/wiki/Post-editing_Analysis"&gt;sample post-editing analysis&lt;/a&gt; can be found on our wiki. If you are interested to share your experiences with MT post-editing initiatives and/or find out more about our efforts in this space, sign up for a webinar, etc. write to &lt;a href="mailto:labs@memsource.com"&gt;labs@memsource.com&lt;/a&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;
&lt;!--[if gte mso 9]&gt;&lt;xml&gt;
 &lt;o:OfficeDocumentSettings&gt;
  &lt;o:AllowPNG/&gt;
 &lt;/o:OfficeDocumentSettings&gt;
&lt;/xml&gt;&lt;![endif]--&gt;&lt;!--[if gte mso 9]&gt;&lt;xml&gt;
 &lt;w:WordDocument&gt;
  &lt;w:View&gt;Normal&lt;/w:View&gt;
  &lt;w:Zoom&gt;0&lt;/w:Zoom&gt;
  &lt;w:TrackMoves/&gt;
  &lt;w:TrackFormatting/&gt;
  &lt;w:PunctuationKerning/&gt;
  &lt;w:ValidateAgainstSchemas/&gt;
  &lt;w:SaveIfXMLInvalid&gt;false&lt;/w:SaveIfXMLInvalid&gt;
  &lt;w:IgnoreMixedContent&gt;false&lt;/w:IgnoreMixedContent&gt;
  &lt;w:AlwaysShowPlaceholderText&gt;false&lt;/w:AlwaysShowPlaceholderText&gt;
  &lt;w:DoNotPromoteQF/&gt;
  &lt;w:LidThemeOther&gt;EN-US&lt;/w:LidThemeOther&gt;
  &lt;w:LidThemeAsian&gt;X-NONE&lt;/w:LidThemeAsian&gt;
  &lt;w:LidThemeComplexScript&gt;HI&lt;/w:LidThemeComplexScript&gt;
  &lt;w:Compatibility&gt;
   &lt;w:BreakWrappedTables/&gt;
   &lt;w:SnapToGridInCell/&gt;
   &lt;w:WrapTextWithPunct/&gt;
   &lt;w:UseAsianBreakRules/&gt;
   &lt;w:DontGrowAutofit/&gt;
   &lt;w:SplitPgBreakAndParaMark/&gt;
   &lt;w:EnableOpenTypeKerning/&gt;
   &lt;w:DontFlipMirrorIndents/&gt;
   &lt;w:OverrideTableStyleHps/&gt;
  &lt;/w:Compatibility&gt;
  &lt;m:mathPr&gt;
   &lt;m:mathFont m:val="Cambria Math"/&gt;
   &lt;m:brkBin m:val="before"/&gt;
   &lt;m:brkBinSub m:val="&amp;#45;-"/&gt;
   &lt;m:smallFrac m:val="off"/&gt;
   &lt;m:dispDef/&gt;
   &lt;m:lMargin m:val="0"/&gt;
   &lt;m:rMargin m:val="0"/&gt;
   &lt;m:defJc m:val="centerGroup"/&gt;
   &lt;m:wrapIndent m:val="1440"/&gt;
   &lt;m:intLim m:val="subSup"/&gt;
   &lt;m:naryLim m:val="undOvr"/&gt;
  &lt;/m:mathPr&gt;&lt;/w:WordDocument&gt;
&lt;/xml&gt;&lt;![endif]--&gt;&lt;!--[if gte mso 9]&gt;&lt;xml&gt;
 &lt;w:LatentStyles DefLockedState="false" DefUnhideWhenUsed="true"
  DefSemiHidden="true" DefQFormat="false" DefPriority="99"
  LatentStyleCount="267"&gt;
  &lt;w:LsdException Locked="false" Priority="0" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Normal"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="heading 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 7"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 8"/&gt;
  &lt;w:LsdException Locked="false" Priority="9" QFormat="true" Name="heading 9"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 7"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 8"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" Name="toc 9"/&gt;
  &lt;w:LsdException Locked="false" Priority="35" QFormat="true" Name="caption"/&gt;
  &lt;w:LsdException Locked="false" Priority="10" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Title"/&gt;
  &lt;w:LsdException Locked="false" Priority="1" Name="Default Paragraph Font"/&gt;
  &lt;w:LsdException Locked="false" Priority="11" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Subtitle"/&gt;
  &lt;w:LsdException Locked="false" Priority="22" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Strong"/&gt;
  &lt;w:LsdException Locked="false" Priority="20" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Emphasis"/&gt;
  &lt;w:LsdException Locked="false" Priority="59" SemiHidden="false"
   UnhideWhenUsed="false" Name="Table Grid"/&gt;
  &lt;w:LsdException Locked="false" UnhideWhenUsed="false" Name="Placeholder Text"/&gt;
  &lt;w:LsdException Locked="false" Priority="1" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="No Spacing"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" UnhideWhenUsed="false" Name="Revision"/&gt;
  &lt;w:LsdException Locked="false" Priority="34" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="List Paragraph"/&gt;
  &lt;w:LsdException Locked="false" Priority="29" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Quote"/&gt;
  &lt;w:LsdException Locked="false" Priority="30" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Intense Quote"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 1"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 2"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 3"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 4"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 5"/&gt;
  &lt;w:LsdException Locked="false" Priority="60" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Shading Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="61" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light List Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="62" SemiHidden="false"
   UnhideWhenUsed="false" Name="Light Grid Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="63" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 1 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="64" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Shading 2 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="65" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 1 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="66" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium List 2 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="67" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 1 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="68" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 2 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="69" SemiHidden="false"
   UnhideWhenUsed="false" Name="Medium Grid 3 Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="70" SemiHidden="false"
   UnhideWhenUsed="false" Name="Dark List Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="71" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Shading Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="72" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful List Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="73" SemiHidden="false"
   UnhideWhenUsed="false" Name="Colorful Grid Accent 6"/&gt;
  &lt;w:LsdException Locked="false" Priority="19" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Subtle Emphasis"/&gt;
  &lt;w:LsdException Locked="false" Priority="21" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Intense Emphasis"/&gt;
  &lt;w:LsdException Locked="false" Priority="31" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Subtle Reference"/&gt;
  &lt;w:LsdException Locked="false" Priority="32" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Intense Reference"/&gt;
  &lt;w:LsdException Locked="false" Priority="33" SemiHidden="false"
   UnhideWhenUsed="false" QFormat="true" Name="Book Title"/&gt;
  &lt;w:LsdException Locked="false" Priority="37" Name="Bibliography"/&gt;
  &lt;w:LsdException Locked="false" Priority="39" QFormat="true" Name="TOC Heading"/&gt;
 &lt;/w:LatentStyles&gt;
&lt;/xml&gt;&lt;![endif]--&gt;&lt;!--[if gte mso 10]&gt;
&lt;style&gt;
 /* Style Definitions */
 table.MsoNormalTable
 {mso-style-name:"Table Normal";
 mso-tstyle-rowband-size:0;
 mso-tstyle-colband-size:0;
 mso-style-noshow:yes;
 mso-style-priority:99;
 mso-style-parent:"";
 mso-padding-alt:0in 5.4pt 0in 5.4pt;
 mso-para-margin:0in;
 mso-para-margin-bottom:.0001pt;
 mso-pagination:widow-orphan;
 font-size:11.0pt;
 mso-bidi-font-size:10.0pt;
 font-family:"Calibri","sans-serif";
 mso-ascii-font-family:Calibri;
 mso-ascii-theme-font:minor-latin;
 mso-hansi-font-family:Calibri;
 mso-hansi-theme-font:minor-latin;
 mso-bidi-font-family:Mangal;
 mso-bidi-theme-font:minor-bidi;}
&lt;/style&gt;
&lt;![endif]--&gt;

&lt;br /&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://3.bp.blogspot.com/-l8jtLgR1IC0/TtZmsMuy-HI/AAAAAAAAASc/bV-ltEC3u58/s1600/DavidCanek.jpg" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" src="http://3.bp.blogspot.com/-l8jtLgR1IC0/TtZmsMuy-HI/AAAAAAAAASc/bV-ltEC3u58/s1600/DavidCanek.jpg" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="font-size: x-small;"&gt;&lt;span&gt;David Canek is
the founder and CEO of MemSource Technologies, a software company providing
cloud translation technology. David, a graduate from Translation and
Comparative Studies, received his education at Charles University, Prague,
Humboldt University in Berlin and the University of Vienna. His professional
experience includes business development and product management roles in the
software and translation industries. David is keen on pursuing innovative
trends in the translation industry, such as machine translation post-editing or
cloud-based translation technologies and has presented on these topics at
leading industry conferences, such as Localization World, Tekom, ATA and
others.&lt;/span&gt;&lt;/span&gt;&lt;/div&gt;
&lt;/div&gt;
&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-1224203423238032128?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/O1AoQjC4AjMYlxY_rTV9SAjBzMQ/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/O1AoQjC4AjMYlxY_rTV9SAjBzMQ/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/O1AoQjC4AjMYlxY_rTV9SAjBzMQ/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/O1AoQjC4AjMYlxY_rTV9SAjBzMQ/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=lLiaxPYGLwA:wkSr3C7vlyc:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=lLiaxPYGLwA:wkSr3C7vlyc:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=lLiaxPYGLwA:wkSr3C7vlyc:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=lLiaxPYGLwA:wkSr3C7vlyc:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/lLiaxPYGLwA" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/1224203423238032128/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/11/wanted-fair-and-simple-compensation.html#comment-form" title="16 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/1224203423238032128?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/1224203423238032128?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/lLiaxPYGLwA/wanted-fair-and-simple-compensation.html" title="Wanted: A Fair and Simple Compensation Scheme for MT Post-Editing" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://lh4.ggpht.com/-djNCCjEJqS0/TtWI25BTsdI/AAAAAAAAASU/gHbsGlEvHUE/s72-c/clip_image002_thumb.jpg?imgmax=800" height="72" width="72" /><thr:total>16</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/11/wanted-fair-and-simple-compensation.html</feedburner:origLink></entry><entry gd:etag="W/&quot;D08CQno7fCp7ImA9WhRSEUU.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-2956702291132537412</id><published>2011-10-28T12:08:00.001-07:00</published><updated>2011-11-13T04:04:23.404-08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2011-11-13T04:04:23.404-08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="Post-editing" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><category scheme="http://www.blogger.com/atom/ns#" term="conferences" /><title>The Building Momentum for Post-Edited Machine Translation (PEMT)</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
This is an &lt;i&gt;(opinionated)&lt;/i&gt; summary of interesting findings from a flurry of conferences that I attended earlier this month. The conferences were the TAUS User Conference, Localization World and tekom. Even though it is tiring to have so many so close together, it is interesting to see what sticks out a few weeks later. For me TAUS and tekom were clearly worthwhile, and Localization World was not, and I believe that #LWSV is an event that is &lt;a href="http://www.urbandictionary.com/define.php?term=mojo"&gt;losing it’s mojo&lt;/a&gt; in spite of big attendance numbers.&lt;/div&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Some of the big themes that stand out (mostly from TAUS) were:&lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: left;"&gt;
&lt;li&gt;Detailed case studies that provide clear and specific evidence that &lt;b&gt;customized&lt;/b&gt; MT enhances and improves the productivity of traditional (TEP) translation processes&lt;/li&gt;
&lt;li&gt;The Instant on-demand Moses MT engine parade&lt;/li&gt;
&lt;li&gt;Initial attempts at defining post-editing effort and difficulty from MemoQ and Memosource&lt;/li&gt;
&lt;li&gt;A future session on the multilingual web from speakers who actually are involved with big perspective, global web-wide changes and requirements&lt;/li&gt;
&lt;li&gt;More MT hyperbole &lt;/li&gt;
&lt;li&gt;The bigger context and content production chain for translation that is visible at tekom&lt;/li&gt;
&lt;li&gt;Post-editor feedback at tekom&lt;/li&gt;
&lt;li&gt;The lack of innovation in most of the content presented at Localization World&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&amp;nbsp;The archived twitter stream from TAUS (#tausuc11) is &lt;a href="http://www.scribd.com/doc/70688108/TAUS-User-Conference-2011-Tweets"&gt;available here&lt;/a&gt;, the tekom tag is #tcworld11 and Localization World is #lwsv. Many of the TAUS presentations will be available as web video shortly and I recommend that you check some of them out.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="font-size: large;"&gt;&lt;b&gt;PEMT Case Studies&lt;/b&gt;&lt;/span&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
In the last month I have seen several case studies that document the time and cost savings and overall consistency benefits of good customized MT systems. At TAUS, Caterpillar indicated that their demand for translation was rising rapidly and thus they instituted their famed controlled language (Caterpillar English) based translation production process using MT. &lt;b&gt;The MT process was initially more expensive since 100% of the segments needed to be reviewed but they are now seeing better results on their quality measurements from MT than from human translators on Brazilian Portuguese and Russian according to Don Johnson, Caterpillar&lt;/b&gt;. They expect to expand to new kinds of content as these engines mature.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Catherine Dove of PayPal described how the human translation process got bogged down on review and rework cycles (to ensure PayPal brand’s tone and style was intact) and was unable to meet production requirements of 15K words per week with a 3 day turnaround in 25 languages. &lt;b&gt;They found that “machine-aided human translation” delivers better, more consistent terminology in the first pass and thus they were able to focus more on style and fluency. Deadlines are easier to meet and she also commented that MT can handle tags better than humans.&lt;/b&gt; They also focus on source cleanup and improvement to leverage the MT efforts and interestingly the MT is also useful in catching errors in the authoring phase. &lt;b&gt;PayPal uses an “edit distance” measurement to determine the amount of rework and have found that the MT process reduces this effort by 20% on 8 of 10 languages they are using MT on&lt;/b&gt;. An additional benefit is that there is a new quality improvement process in place that should continue to yield increasing benefits.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
A PEMT user case study was also presented by Asia Online and Sajan at the Localization Research Conference in September 2011. The global enterprise customer is a major information technology software developer, hardware/IT OEM manufacturer, and comprehensive IT services provider for mission critical enterprise systems in 100+ countries. This company had a legacy MT system developed internally that had been used in the past by the key customer stakeholders. Sajan and Asia Online customized English to Chinese and English to Spanish engines for this customer. &lt;b&gt;These MT systems have been delivering translated output that even beats the first pass output from their human translators due to the highly technical terminology, especially in Chinese&lt;/b&gt;.&amp;nbsp; A summary of the use case is provided below: &lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: left;"&gt;
&lt;li&gt;27 million words have been processed by this client using MT &lt;/li&gt;
&lt;li&gt;Large amounts of quality TM (many millions of words) and glossaries were provided and these engines are expected to continue to improve with additional feedback.&lt;/li&gt;
&lt;li&gt;The customized engine was focused on the broad IT domain and was intended to translate new documentation and support content from English into Chinese and Spanish.&lt;/li&gt;
&lt;li&gt;A key objective of the project was to eliminate the need for full translation and limit it to MT + Post-editing as a new modified production process.&lt;/li&gt;
&lt;li&gt;The custom engine output delivered &lt;b&gt;&lt;u&gt;higher quality than their first pass human translators especially in Chinese&lt;/u&gt;&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;All output was proof read to deliver publication quality.&lt;/li&gt;
&lt;li&gt;Using Asia Online Language Studio the customer &lt;b&gt;&lt;u&gt;saved 60% in costs and 77% in time over previous production processes based on their own structured time and cost measurements. &lt;/u&gt;&lt;/b&gt;&lt;/li&gt;
&lt;li&gt;The client also produces an MT product, but the business units prefer to use Asia Online because of considerable quality and cost differences.&lt;/li&gt;
&lt;li&gt;Client extremely impressed with result especially when compared to the output of their own engine. &lt;/li&gt;
&lt;li&gt;The new pricing model enabled by MT creates a situation where the higher the volume the more beneficial the outcome.&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
The video presentation below by Sajan begins at 27 minutes &lt;i&gt;(in case you want to skip over the Asia Online part)&lt;/i&gt; and even if you only watch the Sajan presentation for 5 minutes you will get a clear sense for the benefit delivered by the PEMT process.&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;object class="BLOGGER-youtube-video" classid="clsid:D27CDB6E-AE6D-11cf-96B8-444553540000" codebase="http://download.macromedia.com/pub/shockwave/cabs/flash/swflash.cab#version=6,0,40,0" data-thumbnail-src="http://1.gvt0.com/vi/hjK17GWynoU/0.jpg" height="266" width="320"&gt;&lt;param name="movie" value="http://www.youtube.com/v/hjK17GWynoU&amp;fs=1&amp;source=uds" /&gt;




&lt;param name="bgcolor" value="#FFFFFF" /&gt;




&lt;embed width="320" height="266"  src="http://www.youtube.com/v/hjK17GWynoU&amp;fs=1&amp;source=uds" type="application/x-shockwave-flash"&gt;&lt;/embed&gt;&lt;/object&gt;&lt;/div&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
A session on the multilingual web at TAUS by the trio &lt;a href="http://www.translationautomation.com/taus-user-conference-2011-panel-bios.html"&gt;Bruno Fernandez Ruiz&lt;/a&gt;, Yahoo! Fellow and Vice President, &lt;a href="http://www.translationautomation.com/taus-user-conference-2011-panel-bios.html"&gt;Bill Dolan&lt;/a&gt;, Head of NLP Research, Microsoft, &lt;a href="http://www.translationautomation.com/taus-user-conference-2011-panel-bios.html"&gt;Addison Phillips&lt;/a&gt;, Chair, W3C Internationalization Group / Amazon also produced many interesting observations such as:&lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: left;"&gt;
&lt;li&gt;The impact of “Big Data” and the cloud will affect language perspectives of the future and the tools and processes of the future need to change to handle the new floating content. &lt;/li&gt;
&lt;li&gt;Future applications will be built once and go to multiple platforms (PC, Web, Mobile, Tablets)&lt;/li&gt;
&lt;li&gt;The number of small nuggets of information that need to be translated instantly will increase dramatically&lt;/li&gt;
&lt;li&gt;HTML5 will enable publishers to be much freer in information creation and transformation processes and together with CSS3 and Javascript can handle translation of flowing data across multiple platforms&lt;/li&gt;
&lt;li&gt;Semantics have not proven to be necessary to solve a lot of MT problems contrary to what many believed even 5 years ago. Big Data will help us to solve many linguistic problems that involve semantics&lt;/li&gt;
&lt;li&gt;Linking text to location and topic to find cultural meaning will become more important to developing a larger translation perspective&lt;/li&gt;
&lt;li&gt;Engagement around content happens in communities where there is a definable culture, language and values dimension&lt;/li&gt;
&lt;li&gt;While data availability continues to explode for the major languages we are seeing a digital divide for the smaller languages and users will need to engage in translation to make more content in these languages happen&lt;/li&gt;
&lt;li&gt;Even small GUI projects of 2,000 words are found to have better results with MT + crowdsourcing than with professional translation&lt;/li&gt;
&lt;li&gt;More translation will be of words and small phrases where MT + crowdsourcing can outperform HT&lt;/li&gt;
&lt;li&gt;User s need to be involved in improving MT and several choices can be presented to users to determine the “best” ones&lt;/li&gt;
&lt;li&gt;The community that cares about solving language translation problems will grow beyond the professional translation industry.&lt;/li&gt;
&lt;/ul&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
At TAUS, there were several presentations on Moses tools and instant Moses MT engines via a one or two step push button approach. While these tools facilitate the creation of “quick and dirty data” MT engines, &lt;b&gt;I am skeptical of the value of this approach for real production quality engines where the objective is provide long-term translation production productivity. As Austin Powers once said, “This is emPHASIS on the wrong syll&lt;/b&gt;&lt;b&gt;ABLE" &lt;/b&gt;My professional experience is that the key to long-term success (i.e. really good MT systems) is to really clean the data and this means more than removing formatting tags and removing the most obvious crap. This is harder than most think. Real cleaning also involves linguistic and bilingual human supervised alignment analysis. Also, I have seen that it takes perhaps thousands of attempts across many different language pairs to understand what is happening when you throw data into the hopper, and that this learning is critical to fundamental success with MT and developing continuous improvement architectures. I expect that some Moses initiatives will produce decent gist engines, but are unlikely to do much better than Google/Bing for the most part. I disagree with Jaap’s call to the community to produce thousands of MT systems, &lt;b&gt;what we really need to see are a few hundred really good, kick-ass systems, rather than thousands that do not even measure up to the free online engines.&lt;/b&gt; And so far, getting a really good MT engine is not possible without real engagement from linguists and translators and more effort than pushing a button. &lt;b&gt;We all need to be wary of instant solutions, with thousands of MT engines produced rapidly but all lacking in quality and "new" super semantic approaches that promise to solve the automated translation problem without human assistance. I predict that the best systems will still come from close collaboration with linguists and translators and insight borne from experience.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;I was also excited to see the initiative from MemoQ to establish a measure of translator productivity or post-editing effort expended, by creating an open source measurement of post-edited output, where the assumption is that an untouched segment is a good one. &lt;b&gt;MemoQ will use an open and published edit distance algorithm that could be helpful in establishing better pricing for MT post-editing &lt;/b&gt;and they also stressed the high value of terminology in building productivity. While there is already much criticism of the approach, I think this is a great first step to formulating a useful measurement. At tekom I also got a chance to see the scheme that MemSource has developed where post-edited output is mapped back to a fuzzy matching scheme to establish a more equitable post-editing pricing scheme than advocated by some LSPs. I look forward to seeing this idea spread and hope to cover it in more detail in the coming months&lt;/span&gt;.&lt;br /&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Localization World was a disappointing affair and I was struck by how mundane, unimaginative and irrelevant much of the content of the conference was. While the focus of the keynotes was apparently innovation, I found the @sarahcuda presentation interesting, but not very compelling or convincing at all in terms of insight into innovation. The second day keynote was just plain bad, filled with clichés and obvious truisms e.g. “You have to have a localization plan” or “I like to sort ideas in a funnel”. &lt;i&gt;(Somebody needs to tell Tapling that he is not the CEO anymore even though it might say so on his card)&lt;/i&gt;. I heard several others complain about the quality of many sessions, and apparently in some sessions audience members were openly upset. T&lt;b&gt;he MT sessions were really weak in comparison to TAUS and rather than broadening the discussion they succeeded in mostly making them vague and insubstantial. The most interesting (and innovative) sessions that I was witness to were the &lt;a href="http://www.fastcompany.com/1787015/smartling-ceo-jack-welde-translation-localization"&gt;Smartling use case studies&lt;/a&gt; and a pre-conference session on Social Translation.&lt;/b&gt; Both of these sessions focused on how the production model is changing and both were not particularly well attended. I am sure that there were others that were worthwhile (or maybe not), but it appears that this conference will matter less and less in terms of producing compelling and relevant content that provides value in the Web 2.0 world. This event is useful to meet with people but I truly wonder how many will attend for the quality of the content.&lt;/div&gt;
&lt;br /&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;The tekom event is a good event to get a sense for how technical business translation fits into the overall content creation chain and also see how synergies could be created within this chain. &lt;b&gt;There were many excellent sessions and it is the kind of event that helps you to broaden your perspective and understand how you fit into a bigger picture and ecosystem.&lt;/b&gt; The event has 3300 visitors so it is also a much larger perspective in terms of many different views points. I had a detailed conversation with some translators about post-editing. They were most concerned about the compensation structure and post-editor recruitment practices. &lt;b&gt;They specifically pointed out how unfair the SDL practice of paying post-editors 60% of standard rates was, and asked that more equitable and fair systems be put into place. LSPs and buyers would be wise to heed this feedback if they want to be able to recruit quality people in future&lt;/b&gt;. I got a close look at the MemSource approach to making this more fair, and I think that this approach which measures the actual work done at a segment level should be acceptable to many. This approach measures the effort after the fact. &lt;b&gt;However, we still need to do more on making the difficulty of the task before the translators begin more transparent. This begins with an understanding of how good the individual MT system is and how much effort is needed to get to production quality levels&lt;/b&gt;. This is an area that I hope to explore further in the coming weeks&lt;/span&gt;.&lt;br /&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I continue to see more progress on the PEMT front and I now have good data of measurable productivity even on a language pair as tough as English to Hungarian. I expect that a partnership of language and MT experts will be more likely to produce compelling results than many DIY initiatives, but hopefully we learn from all the efforts being made.&lt;/div&gt;
&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-2956702291132537412?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/IoB-coSBNQJs8HuUkeibGKz3MMQ/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/IoB-coSBNQJs8HuUkeibGKz3MMQ/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/IoB-coSBNQJs8HuUkeibGKz3MMQ/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/IoB-coSBNQJs8HuUkeibGKz3MMQ/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=4A-2VKC1gbs:ogWBth-rSpY:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=4A-2VKC1gbs:ogWBth-rSpY:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=4A-2VKC1gbs:ogWBth-rSpY:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=4A-2VKC1gbs:ogWBth-rSpY:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/4A-2VKC1gbs" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/2956702291132537412/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/10/building-momentum-for-post-edited.html#comment-form" title="13 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/2956702291132537412?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/2956702291132537412?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/4A-2VKC1gbs/building-momentum-for-post-edited.html" title="The Building Momentum for Post-Edited Machine Translation (PEMT)" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><thr:total>13</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/10/building-momentum-for-post-edited.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CkYNQ3c5fip7ImA9WhdUEkg.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-5222042790734914384</id><published>2011-09-27T14:28:00.001-07:00</published><updated>2011-09-28T15:49:52.926-07:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2011-09-28T15:49:52.926-07:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="crowdsourcing" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><category scheme="http://www.blogger.com/atom/ns#" term="conferences" /><title>The Growing Interest &amp; Concern About the Future of Professional Translation</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I have noticed of late that every conference has a session or two that focuses on the future. Probably because many sense that change is in the air. Some of you may also have noticed that the protest from some quarters has &lt;a href="http://www.translationtribulations.com/2011/09/future-is-here-artful-manipulation.html"&gt;grown more strident&lt;/a&gt; or even outright rude, to some of the ideas presented at these future outlook sessions. The most vocal protests seem to be directed at predictions about the increasing use of machine translation, anything about “good enough” quality and the process and production process changes necessary to deal with the increasing translation volume. (There are still some who think that &lt;a href="http://kv-emptypages.blogspot.com/2010/04/data-deluge-and-growing-need-for.html"&gt;the data deluge&lt;/a&gt; is a myth).&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Some feel personally threatened by those who speak on these subjects and rush to kill or at least stab the messenger. I think they miss the point that &lt;b&gt;what is happening in translation, is just part of a larger upheaval in the way global enterprises are interacting with customers. The forces causing change in translation are also creating upheaval in marketing, operations and product development departments as &lt;a href="http://www.cluetrain.com/book/"&gt;many analysts have remarked&lt;/a&gt; for some time now.&lt;/b&gt; The discussion in the professional translation blogosphere is polarized enough (translators vs. technology advocates) that dialogue is difficult, but hopefully we all continue to speak with increasing clarity, so that the polemic subsides. &lt;b&gt;The truth is that none of us really knows the definite future, but that should not stop us from making educated &lt;i&gt;(or even wild)&lt;/i&gt; guesses at where current trends may lead.&lt;/b&gt; &lt;i&gt;(I highly recommend you &lt;b&gt;skim &lt;a href="http://www.cluetrain.com/book/markets.html"&gt;The Cluetrain Manifesto&lt;/a&gt; &lt;/b&gt;to get a sense for the broader forces at play.)&lt;/i&gt;&lt;/div&gt;
&lt;blockquote style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Brian Solis has a new book coming out that describes the overall change quite succinctly. &lt;i&gt;&lt;a href="http://www.briansolis.com/2011/08/announcing-the-end-of-business-as-usual/"&gt;The End of Business As Usual&lt;/a&gt;&lt;/i&gt; (his new book&lt;i&gt;)&lt;/i&gt; explores each layer of the complex consumer revolution that is changing the future of business, media, and culture. &lt;b&gt;As consumers further connect with one another, a vast and efficient information network takes shape and begins to steer experiences, decisions, and markets. It is nothing short of disruptive.&lt;/b&gt;&lt;/blockquote&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I was watching the Twitter feed from two conferences last week (&lt;a href="http://www.localisation.ie/resources/conferences/2011/programme.htm"&gt;LRC XVI&lt;/a&gt; in Ireland and &lt;a href="http://tconf.com/program/"&gt;Translation Forum&lt;/a&gt; in Russia)&amp;nbsp; and I thought it would be interesting to summarize and highlight some of &lt;b&gt;the tweets as they pertain to this changing world and perhaps provide more clarity about the trends from a variety of voices and perspectives.&lt;/b&gt; &lt;b&gt;The LRC conference had several speakers from large IT companies who talked about their specific experience, as well as technology vendor and LSP presentations.&lt;/b&gt; For those who are not aware, CSA research identifies IT as one of the single largest sectors buying professional translation services. The chart below shows the sectors with the largest share of global business. This chart is also probably a good way to understand where these changes are being felt most strongly. &lt;/div&gt;
&lt;a href="http://lh5.ggpht.com/-g3BZ3W2-b1c/ToI_xoV09MI/AAAAAAAAARo/PaJzFR8mS3U/s1600-h/image%25255B2%25255D.png"&gt;&lt;img alt="image" border="0" height="130" src="http://lh6.ggpht.com/-c8Cbk2V4pKg/ToI_yEa796I/AAAAAAAAARs/uTV5w7NO3IQ/image_thumb.png?imgmax=800" style="border-bottom: 0px; border-left: 0px; border-right: 0px; border-top: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt; &lt;br /&gt;
&lt;br /&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;Here are some &lt;/span&gt;&lt;a href="http://twitter.com/#%21/search/realtime/%23lrcconf" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;Twitter highlights from LRC&lt;/a&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt; on the increasing volume of translation, changing content, improving MT and changing translation production needs. I would recommend that you check out &lt;/span&gt;&lt;a href="http://twitter.com/#%21/TheRosettaFound" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;@therosettafound&lt;/a&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt; for the most complete Twitter trail. I have made minor edits to provide context and clarify abbreviations and have attempted to provide some basic organization to the tweet trail to make it somewhat readabl&lt;/span&gt;e.&lt;br /&gt;
&lt;a href="http://lh3.ggpht.com/-Lbmf_h_Qifs/ToI_1UPnDEI/AAAAAAAAARw/Ikx2nWX4cJ8/s1600-h/image%25255B8%25255D.png"&gt;&lt;img alt="image" border="0" height="164" src="http://lh6.ggpht.com/-6W6-QG1CWjg/ToI_2kEh7KI/AAAAAAAAAR0/wSYm42UIZNU/image_thumb%25255B2%25255D.png?imgmax=800" style="border-bottom: 0px; border-left: 0px; border-right: 0px; border-top: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt; &lt;br /&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/CNGL"&gt;CNGL&lt;/a&gt; Changing content consumption and creation models require new translation and localisation models – (according to) &lt;a href="http://twitter.com/#%21/RobVandenberg"&gt;&lt;s&gt;@&lt;/s&gt;&lt;b&gt;RobVandenberg&lt;/b&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt; &lt;b&gt;We are all authors, the enterprise is going social - implications for localisation?&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/ArleLommel"&gt;ArleLommel&lt;/a&gt; &lt;b&gt;Quality even worse than Rob Vandenberg says: we have no real idea what it is/how to measure, especially in terms of customer impact&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Issue is NOT MT vs. human translation (HT). It's becoming MT AND HT. Creates new opportunities for domain experts.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Dion Wiggins. &lt;b&gt;LSPs not using MT will put themselves out of business? Prediction: yes in four/five years&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;CNGL says 25% of translators/linguists use MT. I wonder how many use it but say they don't use it due to (negative) perception (with peers)?&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Waiting for translation technology equivalent of iPhone: something that transforms what we do in ways we can't yet imagine.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
Tweets from &lt;b&gt;Jason Rickhard’s presentation on Collaborative Translation&lt;/b&gt; (i.e. Crowdsourcing) and IT go Social. &lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;Jason of Symantec giving the enterprise perspective, added 15-20 languages to small but popular product, built tech to support this. Not just linguistic but also legal, organizational issues to be resolved in collaborative, paid-for product.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Is collaborative translation bad &amp;amp; not-timely? &lt;a href="http://twitter.com/#%21/search?q=%23lrcconf"&gt;&lt;s&gt;#&lt;/s&gt;lrcconf&lt;/a&gt; Not so, a lot of translators = involved users of the content/product they translate.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Review process is different in collaborative translation. Done by voting, not by editors&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;The smaller the language gets, the more motivated volunteer translators are and the better collaborative translation works.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Is volunteering something for people who don't have to worry that their day-to-day basics are covered?&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Does collaborative translation and collaboration mean that content owners "give up the illusion of control" over their content?&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Enterprises do collaborative translation for languages they would/could not cover otherwise - true, for both profit and non-profits&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Collaborative/Community will not replace existing service providers but open up more content for more languages&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Language Service Providers could play an important role in community translation by building, supporting, moderating communities&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;It's not correct to say Community Translation = bad; Professional Translation = good&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Microsoft appoints moderators with a passion for the project/language for community localization&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;&amp;gt;1,200 users translated Symantec products into 35 languages&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
If &amp;gt;1,200 were needed to translate 2 small-ish products, how can millions of translators translating 1 ZB be 'managed'?&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/ArleLommel"&gt;ArleLommel&lt;/a&gt;&lt;u&gt; &lt;/u&gt;&lt;b&gt;Symantec research: Community involvement in support often leads to ~25% reduction in support spend&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;“Super users” are what make communities scalable. Key is to identify/cultivate them early in the process&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Jason Rickard: Dell is a good example of using Facebook for support. One of few companies with real metrics and insight in this area.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Jason Rickard: Symantec has really cool/systemic/well-thought ways to support community&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
&lt;br /&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;21st generation localisation is about the user, about user-generated content - Ellen Langer: Give up the Illusion of Control&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/ArleLommel"&gt;ArleLommel&lt;/a&gt;&lt;u&gt; &lt;/u&gt;Illusion of control? You mean we can have even less control that we have now? That's a scary thought!&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;&lt;b&gt;The most dramatic shifts driven by the web happened because communities took over - Imagine: 100000s of user translators translating billions of words into 100s of languages - control that&lt;/b&gt;!&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Seems the deep and complex problems of localisation are a minute drop in the ocean of digital content management&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/CNGL"&gt;CNGL&lt;/a&gt;&lt;u&gt; &lt;/u&gt;Discovery, analysis, transformation - Alex O'Connor tells how CNGL is addressing the grand challenges of digital content management&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;&lt;b&gt;Is the L10N industry due for a wave of destruction or positive transformation?&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/ArleLommel"&gt;ArleLommel&lt;/a&gt;&lt;u&gt; &lt;/u&gt;Yes, &lt;b&gt;Most of the mainstream technologies for translators are non-ergonomic and still in 20-year-old paradigms&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
Tweets from &lt;b&gt;Tony Allen, Product Manager Intel Localisation Solutions &lt;/b&gt;presentation&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;30+ langs &amp;gt;200k pages &amp;gt;40% localised @ Intel's web presence. &lt;b&gt;Intel: important to have user-driven content, interaction with the customer. &lt;/b&gt;Integration important, e.g. multilingual support chat. Integration, Interoperability key issues for Intel L10N. &lt;b&gt;To figure out how content flows, without loss of metadata, interoperates with internal/external range of systems, is crucial.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
2.5b netizens, &amp;gt;15b connected devices &amp;gt;1 zetabyte of traffic by 2015 and companies will interact with their customers using social media - type setups; new challenges for localization.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;&lt;a href="http://twitter.com/#%21/search?q=%23intel"&gt;&lt;s&gt;#&lt;/s&gt;intel&lt;/a&gt; What does it mean for localization infrastructures if we have &amp;gt;1 zetabyte of content in 2015? Current methods won't keep up&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/ArleLommel"&gt;ArleLommel&lt;/a&gt;&lt;u&gt; &lt;/u&gt;&lt;a href="http://twitter.com/#%21/search?q=%23intel"&gt;&lt;s&gt;#&lt;/s&gt;&lt;b&gt;intel&lt;/b&gt;&lt;/a&gt; says that interoperability standards are required for cloud to meet future demands. L10n must evolve to meet this need too.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
@&lt;a href="http://twitter.com/#%21/ArleLommel"&gt;ArleLommel&lt;/a&gt;&lt;u&gt; &lt;/u&gt;&lt;b&gt;Alison Toon (#hp) puts it this way: “localization (people) are the garbage collectors of the documentation world”&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;600GB of data in Oracle's Translation Platform - &lt;b&gt;We need concise well-structured content - then we're going to be able to deliver efficient translation services&lt;/b&gt; - How to get it right: analyze content, identify problems and throw it back into the face of writers and developers. &lt;b&gt;I18N and l10n have to get into the core curriculum at Universities says Paul Leahy (of Oracle), since we spend too much time teaching it.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
Tweets from &lt;b&gt;Sajan / Asia Online MT presentation&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;MT cannot perform magic on bad source text - user-generated non-native-speaker content is often 'bad'&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
MT errors make me laugh... but human errors make me cry - an old quote from previously recycled presentations... Asia Online&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Dirty Data SMT - what kind of translations would you expect? If there are no humans involved you are training on dirty data, says Asia Online. Sajan achieved 60% reduction in costs and 77% time savings for specific project &lt;/b&gt;- a miracle? Probably no, let’s see.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Millions of words faster, cheaper, better translated by Sajan using Asia Online - is this phenomenal success transferable? How? &lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
XLIFF contributed to the success of Sajan/Asia Online's MT project. &lt;b&gt;Asia Online's process rejected 26% of TM training data.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
Tweets from &lt;b&gt;Martin Orsted, Microsoft &lt;/b&gt;presentation&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;Cloud will lead to improved cycle times and scalability: 100+ languages, millions of words&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Extraordinary scale: 106 languages for the next version of Office. Need a process that scales up &amp;amp; down in proportion.&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Microsoft: We have fewer people than ever and we are doing more and more languages than ever&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Martin: "The Language Game - Make it fun to review Office"... here is a challenge :) Great idea to involve community via game&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
How can a "Game" approach be used for translation? Levels of experience, quality, domains, complexity; rewards?&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;No more 'stop &amp;amp; go', just let it flow &lt;a href="http://twitter.com/#%21/search?q=%23lrcconf"&gt;@robvandenburg&lt;/a&gt; &amp;gt;&amp;gt;Continuous publishing requires continuous translation. New workflows&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
Tweets from Derek Coffey, Welocalize presentation Are we the FedEx or the WallMart of words?&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;&lt;b&gt;TMS of SDL = burning stacks of cash - Reality: we support your XLIFF, but not your implementation&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Lack of collaboration, workflow integration, content integration = most important bottle necks&lt;/b&gt;. Welocalize, MemoQ, Kilgray and Ontram working on &lt;a href="http://interoperability-now.org/tiki/"&gt;reference implementation&lt;/a&gt; - Derek: Make it compelling for translators to work for us&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
It's all about the translators and they will seek to maximise their earning potential according to Derek. &lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;
Tweets from Future Panel&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
@&lt;a href="http://twitter.com/#%21/TheRosettaFound"&gt;TheRosettaFound&lt;/a&gt;&lt;u&gt; &lt;/u&gt;Many translators don't know what XML looks like &lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Rob: more collaborative, community translation - Rob: Users who consume content will have a large input into the translation BINGO&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Tony: users will drive localisation decision, translation live&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Derek: future is in cooking xxx? Open up a whole new market - user generated, currently untranslatable content. HUGE market&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Derek: need to re-invent our industry, with focus on supply chain&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
The end of the big projects - how are we going to make money (question from audience)&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;From service/product to community - the radical change for enterprises, according to Fred&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
No spark, big bang, revolution - but continuous change, Derek&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Big Spark (Dion): &lt;b&gt;English will no longer remain the almost exclusive source language&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;a href="http://lh6.ggpht.com/-E4GeAJzoqnI/ToI_4M4LSyI/AAAAAAAAAR4/tuJRsK3DLMg/s1600-h/image%25255B5%25255D.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh3.ggpht.com/-4i2Oo5GwqkA/ToI_4hd2mMI/AAAAAAAAAR8/kGEG0vhyiKo/image_thumb%25255B1%25255D.png?imgmax=800" style="border-bottom: 0px; border-left: 0px; border-right: 0px; border-top: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt;&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
The &lt;a href="http://twitter.com/#%21/search/realtime/%23tfru"&gt;Translation Forum Russia twitter trail&lt;/a&gt; has a much more translator oriented focus and is also bilingual. Here are some highlights below, again with minor edits to improve readability.&lt;/div&gt;
&lt;br /&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;a href="http://twitter.com/#%21/antonkunin"&gt;@antonkunin&lt;/a&gt; &lt;b&gt;Listened to an information-packed keynote by &lt;a href="http://twitter.com/#%21/Doug_Lawrence"&gt;&lt;strike&gt;&lt;s&gt;@&lt;/s&gt;&lt;/strike&gt;&lt;/a&gt;&lt;a href="http://twitter.com/#%21/Doug_Lawrence"&gt;Doug_Lawrence&lt;/a&gt; at &lt;a href="http://twitter.com/#%21/search?q=%23tfru"&gt;&lt;s&gt;#&lt;/s&gt;tfru&lt;/a&gt; this morning. As rates keep falling, translators' income keeps rising.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;a href="http://twitter.com/#%21/ilbarbaro"&gt;@ilbarbaro&lt;/a&gt; Talking about "the art of interpreting and translation" in the last quarter of 2011 is definitely outdated&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Language and "quality" are important for translators, speed and competence for (final) clients. Really?&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Translators are the weakest link in the translation process&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Bert: here and now translation more important than perfect translation&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Bert on fan subbing as an unstoppable new trend in translation&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Is Bert anticipating my conclusions? Noah's ark was made and run by amateurs, RMS Titanic by professionals&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Carlos Incharraulde: terminology is pivotal in translators training &amp;lt; Primarily as a knowledge transfer tool&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
To renatobeninatto at who said: Translation companies can do without process standards &amp;lt; I don't agree&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;a href="http://twitter.com/#%21/renatobeninatto"&gt;&lt;s&gt;@&lt;/s&gt;renatobeninatto&lt;/a&gt;: Start looking at income rather than price/rates &lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;Evaluating translation is like evaluating haircuts - it's better to be good on time than perfect too late&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Few translation companies do like airlines: 1st class/ Economy/ Discount rates – Esselink&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Traditional translation models only deal w/ tip of iceberg. New models required for other 90%. Esselink&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
Good enough revolution. Good enough translation for Wikileaks, for example. Bert Esselink&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;In 2007 English Russian was $0.22 per word, in 2010 it dropped to $0.16 &lt;a href="http://twitter.com/#%21/Doug_Lawrence"&gt;&lt;s&gt;@&lt;/s&gt;Doug_Lawrence&lt;/a&gt;&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;b&gt;There's much talk on innovation but not much action - don't expect SDL and Lionbridge to be innovative&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;a href="http://twitter.com/#%21/Doug_Lawrence"&gt;&lt;s&gt;@&lt;/s&gt;Doug_Lawrence&lt;/a&gt; all languages except German and French decreased in pricing from 2007 to 2010&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;a href="http://twitter.com/#%21/AndreyLeites"&gt;@AndreyLeites&lt;/a&gt; &lt;s&gt;@&lt;/s&gt;ilbarbaro problem-solving is the most important feature translator should acquire - &lt;b&gt;Don't teach translators technology, teach them to solve problems &lt;/b&gt;- language is a technology, we need to learn how to use it like technology - &lt;b&gt;85% of translators are still women&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;s&gt;@&lt;/s&gt;ilbarbaro 3 points on quality: &lt;b&gt;1. Quality is never absolute, 2. Quality is defined by the customer, 3. Quality can be measured - it is necessary to learn to define quality requirements (precisely)&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: Times,&amp;quot;Times New Roman&amp;quot;,serif;"&gt;
&lt;a href="http://twitter.com/#%21/Kilgraymemoq"&gt;&lt;s&gt;@&lt;/s&gt;Kilgraymemoq&lt;/a&gt; announces that they will open Kilgray Russia before the end of the year&lt;/div&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
This is of course my biased extraction from the stream, but the original Twitter trail will be there for a few more weeks and you can check it out yourself. It is clear to me from seeing the comments above, that at the enterprise level, MT and Community initiatives will continue to gather momentum.&amp;nbsp; Translation volumes will continue to rise and production processes will have to change to adapt to this. Also, I believe, there are translators who are seeking ways to add value in this changing world and I hope that they will provide the example that leads the way in this changing flux.&lt;br /&gt;
&lt;br /&gt;
And for a completely different view of "the future" check this out. &lt;br /&gt;
&lt;br /&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;object class="BLOGGER-youtube-video" classid="clsid:D27CDB6E-AE6D-11cf-96B8-444553540000" codebase="http://download.macromedia.com/pub/shockwave/cabs/flash/swflash.cab#version=6,0,40,0" data-thumbnail-src="http://2.gvt0.com/vi/FmYJFlAuF84/0.jpg" height="266" width="320"&gt;&lt;param name="movie" value="http://www.youtube.com/v/FmYJFlAuF84&amp;fs=1&amp;source=uds" /&gt;



&lt;param name="bgcolor" value="#FFFFFF" /&gt;



&lt;embed width="320" height="266"  src="http://www.youtube.com/v/FmYJFlAuF84&amp;fs=1&amp;source=uds" type="application/x-shockwave-flash"&gt;&lt;/embed&gt;&lt;/object&gt;&lt;/div&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;/div&gt;
&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-5222042790734914384?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/QiTWzjkDh3xhT0c36n57eBCY0Is/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/QiTWzjkDh3xhT0c36n57eBCY0Is/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/QiTWzjkDh3xhT0c36n57eBCY0Is/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/QiTWzjkDh3xhT0c36n57eBCY0Is/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=jxFpgg4cZZo:DlArT_EbLRI:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=jxFpgg4cZZo:DlArT_EbLRI:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=jxFpgg4cZZo:DlArT_EbLRI:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=jxFpgg4cZZo:DlArT_EbLRI:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/jxFpgg4cZZo" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/5222042790734914384/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/09/growing-interest-concern-about-future.html#comment-form" title="12 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/5222042790734914384?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/5222042790734914384?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/jxFpgg4cZZo/growing-interest-concern-about-future.html" title="The Growing Interest &amp;amp; Concern About the Future of Professional Translation" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://lh6.ggpht.com/-c8Cbk2V4pKg/ToI_yEa796I/AAAAAAAAARs/uTV5w7NO3IQ/s72-c/image_thumb.png?imgmax=800" height="72" width="72" /><thr:total>12</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/09/growing-interest-concern-about-future.html</feedburner:origLink></entry><entry gd:etag="W/&quot;C0YNRn8zeSp7ImA9WhdWGEo.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-7080338463633267994</id><published>2011-09-12T16:22:00.001-07:00</published><updated>2011-09-12T16:46:37.181-07:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2011-09-12T16:46:37.181-07:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="standards" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><title>Understanding Where Machine Translation (MT) Makes Sense</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;One of the reasons that many find MT threatening I think, is the claim by some MT enthusiasts that it that it will do EXACTLY the same work that was previously done by multiple individuals in the “translate-edit-proof” chain without the humans, of course. To the best of my knowledge this is not possible today, even though one may produce an occasional sentence where this does indeed happen. &lt;/span&gt;&lt;b style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;If you want final output that is indistinguishable from competent human translation, then you are going to have to use the human “edit-proof” chain to make this happen&lt;/b&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;.&lt;/span&gt; &lt;br /&gt;
&lt;div align="center"&gt;
&lt;a href="http://lh5.ggpht.com/-cgJF45UQgvU/Tm6T6p3UskI/AAAAAAAAAQw/1laa-iBeSRQ/s1600-h/image20.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh6.ggpht.com/-zcbOFLf8_Fo/Tm6T7HvHhYI/AAAAAAAAAQ0/gBQ-KZw1n4w/image_thumb6.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: inline;" title="image" width="244" /&gt;&lt;/a&gt; &lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Some in the industry have attempted to restate the potential of MT from Fully Automated High Quality Translation - FAHQT &lt;i&gt;(Notice how that sounds suspiciously like f*&amp;amp;ked?)&lt;/i&gt; to Fully Automated Useful Translation – FAUT. However, in some highly technical domains it is actually possible to see that carefully customized MT systems can outperform exclusively human-based production, because it is simply not possible to find as many competent technical translators as are required to get the work done.&lt;/div&gt;
&lt;div align="center"&gt;
&lt;a href="http://lh6.ggpht.com/-dVATKa7jU6M/Tm6T7fUOz8I/AAAAAAAAAQ4/62YsqnMgiR8/s1600-h/image23.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh6.ggpht.com/-5WnNWcmCbg4/Tm6T73ucX3I/AAAAAAAAAQ8/hWCExtomuNw/image_thumb7.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: inline;" title="image" width="244" /&gt;&lt;/a&gt; &lt;/div&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
We have seen that both Google and Bing have gotten dramatically better since they switched from RbMT to statistical data-driven approaches, but the free MT solutions have yet to deliver real compelling quality outside of some Romance languages, and the quality is usually far from competent human translation. They also offer very little in terms of control, even if you are not concerned about the serious data privacy issues that their use brings to the user. &lt;b&gt;It is usually worthwhile for professionals to work with specialists who can help them customize these systems to the specific purpose they are intended for&lt;/b&gt;. MT systems evolve and can get better with with small amounts of corrective feedback if they are designed from the outset to do this. &lt;b&gt;Somebody who has built thousands of MT systems, across many language combinations, is likely to offer more value and skill than most can get from using tools like Moses building a handful of systems, or even the limited dictionary building input possible with many RbMT systems.&lt;/b&gt; And how much better can customized systems get than the free systems? Depending on the data volume and quality, it can range from small but very meaningful improvements to significantly better overall quality.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
So where does MT make most sense? &lt;b&gt;Given that there is a significant effort required to customize an MT system, it usually makes most sense when you have ongoing high volume, dynamically created source data and tolerant users or any combination thereof.&lt;/b&gt; It is also important to understand that the higher the quality requirements, the greater the need for human editing and proofing. The graphic below elaborates on this.&lt;/div&gt;
&lt;a href="http://lh3.ggpht.com/-RhG8lqlzrVo/Tm6T8GIY1BI/AAAAAAAAARA/g0xcYp0FUPc/s1600-h/image2.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh6.ggpht.com/-6l-DU9-5CgM/Tm6T8hPBUUI/AAAAAAAAARE/U9CaSyXUbPY/image_thumb.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt;   &lt;br /&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
While MT is unlikely to replace human beings in any application where quality is really important, there are a growing number of cases that show that MT is suitable for:&lt;/div&gt;
&lt;ul style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: left;"&gt;
&lt;li&gt;Highly repetitive content where productivity gains with MT can exceed what is possible with just using TM alone&lt;/li&gt;
&lt;li&gt;Content that would just not get translated otherwise &lt;/li&gt;
&lt;li&gt;Content that simply cannot afford human translation &lt;/li&gt;
&lt;li&gt;High value content that is changing every hour and every day but has a short shelf life &lt;/li&gt;
&lt;li&gt;Knowledge content that facilitates and enhances the global spread of critical knowledge, especially for health and social services&lt;/li&gt;
&lt;li&gt;Content that is created to enhance and accelerate communication with global customers who prefer a self-service model&lt;/li&gt;
&lt;li&gt;Real-time customer conversations in social networks and customer support scenarios&lt;/li&gt;
&lt;li&gt;Content that does not need to be perfect but just approximately understandable&lt;/li&gt;
&lt;/ul&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
So while there are some who would say that MT can be used anywhere and everywhere, I would suggest that a better fit for professional use is where you have ongoing volume, and dynamic but high value source content that can enhance international initiatives. To my mind, customized MT does not make sense for one-time, small localization projects where the customization efforts cannot be leveraged frequently. Free online MT might still prove of some value in these cases, to boost productivity, &lt;b&gt;but as language service providers learn to better use and steer MT, I expect that we will see that they will provide translators access to “highly customized internal systems”&amp;nbsp; for project work, and the value to the translators will be very similar to the value provided by high quality translation memory.&lt;/b&gt;&amp;nbsp; Simply put – it can and will boost productivity even for things like user documentation and software interfaces.&lt;/div&gt;
&lt;a href="http://lh4.ggpht.com/-RNv_JWlCnJw/Tm6T9N4tuEI/AAAAAAAAARI/AnnRQfKQs-Y/s1600-h/image5.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh5.ggpht.com/-UNSd5Bq_vPI/Tm6T9VMF5eI/AAAAAAAAARM/v6lrpczHHMA/image_thumb1.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt; &lt;br /&gt;
&lt;div align="left"&gt;
&lt;br /&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;It is worth understanding that while “good” MT systems can enhance translator productivity in traditional localization projects, they can also enable completely new kinds of translation projects that have larger volumes and much more dynamic content. While we can expect that these systems will continue to improve in quality, they are not likely to produce TEP equivalent output. I expect that these new applications will be a major source for work in the professional translation industry but will require production models that differ from traditional TEP production&lt;/span&gt;.&lt;/div&gt;
&lt;div align="left"&gt;
&lt;a href="http://lh6.ggpht.com/-INusL-1yafg/Tm6T9hAJUHI/AAAAAAAAARQ/Ekc9PvhmGHQ/s1600-h/image8.png"&gt;&lt;img alt="image" border="0" height="184" src="http://lh4.ggpht.com/-lN6o-iLWOH8/Tm6T-ExBdDI/AAAAAAAAARU/nPPMj5DJgMs/image_thumb2.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt;&amp;nbsp; &lt;a href="http://lh5.ggpht.com/-w89XpVLKW_4/Tm6T-_LX56I/AAAAAAAAARY/XCWPz83Qxmc/s1600-h/image17.png"&gt;&lt;img alt="image" border="0" height="115" src="http://lh4.ggpht.com/-Fwm-oP4UQho/Tm6T_MtVLbI/AAAAAAAAARc/rFtHKgoA0Tw/image_thumb5.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="244" /&gt;&lt;/a&gt;     &lt;br /&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
However, we are still at a point in time where there is not a lot of clarity on what post-editing, linguistic steering and MT engine refinement really involve. They do in fact involve many of the same things that are of value in standard localization processes , e.g. unknown word resolution, terminological consistency, DNT lists and style adjustments. They also increasingly include new kinds of linguistic steering designed to “train” the MT system to learn from historical error patterns and corrections. &lt;b&gt;Unfortunately many of the prescriptions on post-editing principles available on LinkedIn and translator forums, are either linked to older generation MT systems (RbMT), systems that really cannot improve much beyond a very limited point or are linked to a specific MT system. In the age of data-driven systems new approaches are necessary and we have only just begun to define this.&lt;/b&gt; These new hybrid systems also allow translators and linguists to create linguistic and grammar rules around the pure data patterns. Hopefully we will see much better “user-friendly” post-editing environments that bring powerful error detection and correction utilities into much more linguistically logical and pro-active feedback loops. These tools can only emerge if more savvy translators are involved (and properly compensated) and we successfully liberate translators from dealing with the horrors of file and format conversions and other non-linguistic tedium that translation today requires. This shift to a mostly linguistic focus could also be much easier with better data interchange standards. &lt;a href="http://blogs.msdn.com/b/translation/archive/2011/06/06/announcement-new-microsoft-translator-release-delivers-community-tools-to-customize-translations-and-api-enhancements.aspx"&gt;The best examples&lt;/a&gt; of these are from Google and &lt;a href="http://blogs.msdn.com/b/translation/archive/2010/03/15/collaborative-translations-announcing-the-next-version-of-microsoft-translator-technology-v2-apis-and-widget.aspx"&gt;Microsoft&lt;/a&gt; rather than the translation industry, thus far.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;a href="http://lh4.ggpht.com/-DSG38MUudsk/Tm6UHhkXnKI/AAAAAAAAARg/gr7Gd_NWdnM/s1600-h/image26.png"&gt;&lt;img alt="image" border="0" height="55" src="http://lh5.ggpht.com/-GKg0Z1V1UGw/Tm6UH91jTBI/AAAAAAAAARk/3Rkoy060RVY/image_thumb8.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="image" width="207" /&gt;&lt;/a&gt;     &lt;br /&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Talking about standards, possibly &lt;a href="http://www.tm-europe.org/content/2nd-international-xliff-symposium-programme"&gt;the most worthwhile of the initiatives focusing on translation data interchange standards&lt;/a&gt; is meeting in Warsaw later this month. The XLIFF symposium IMO is the most concrete and most practical standards discussion going on at the moment and includes academics, LSPs, TAUS, tools vendors and large buyers sharing experiences. The future is all about data flowing in and out of translation processes and we all stand to benefit from real, robust standards that work for all constituencies. &lt;/div&gt;
&lt;/div&gt;
&lt;/div&gt;
&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-7080338463633267994?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/CLQGhP8nhOZa55MGAIdTHNyg1DE/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/CLQGhP8nhOZa55MGAIdTHNyg1DE/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/CLQGhP8nhOZa55MGAIdTHNyg1DE/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/CLQGhP8nhOZa55MGAIdTHNyg1DE/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=KZYnf8BS_oE:VcKLfCIbYAU:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=KZYnf8BS_oE:VcKLfCIbYAU:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=KZYnf8BS_oE:VcKLfCIbYAU:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=KZYnf8BS_oE:VcKLfCIbYAU:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/KZYnf8BS_oE" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/7080338463633267994/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/09/understanding-where-machine-translation.html#comment-form" title="5 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/7080338463633267994?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/7080338463633267994?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/KZYnf8BS_oE/understanding-where-machine-translation.html" title="Understanding Where Machine Translation (MT) Makes Sense" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://lh6.ggpht.com/-zcbOFLf8_Fo/Tm6T7HvHhYI/AAAAAAAAAQ0/gBQ-KZw1n4w/s72-c/image_thumb6.png?imgmax=800" height="72" width="72" /><thr:total>5</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/09/understanding-where-machine-translation.html</feedburner:origLink></entry><entry gd:etag="W/&quot;CEEESHs9cCp7ImA9WhdVF04.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-12580934454006820</id><published>2011-09-05T10:12:00.001-07:00</published><updated>2011-09-22T16:03:29.568-07:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2011-09-22T16:03:29.568-07:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="Post-editing" /><category scheme="http://www.blogger.com/atom/ns#" term="collaboration" /><category scheme="http://www.blogger.com/atom/ns#" term="innovation" /><category scheme="http://www.blogger.com/atom/ns#" term="statistical  MT" /><category scheme="http://www.blogger.com/atom/ns#" term="translation technology" /><category scheme="http://www.blogger.com/atom/ns#" term="conferences" /><title>The Continuing Saga &amp; Evolution of Machine Translation</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I recently attended the 7th IMTT Conference in Cordoba, Argentina. I especially enjoy the IMTT events because somehow they have found a content formula that works for both translators and &lt;a href="http://www.milengo.com/how-four-translation-specialists-worked-together-to-create-the-next-generation-of-lsp/"&gt;LSPs&lt;/a&gt;. You get to see the translation supply chain communicate in real-time. &lt;b&gt;The overall culture of their events is also usually very collaborative, and to my mind the place to see the most open and constructive dialogue between translators and agencies.&lt;/b&gt; Some may not be aware that Argentina has a particularly strong concentration of skilled humans who understand the mechanics of localization (especially in FIGS BrPt), and many of the agencies, even small ones, are able to work with pretty much every TM and TMS (Translation Management System) system in the market with more than a basic level of competence. Because of historical decisions made by @RenatoBeninatto many years ago and a great university educational system, Argentina has become a place with a comprehensive and sizable professional translation eco-system.&lt;/div&gt;
&lt;a href="http://lh5.ggpht.com/-2hJg1dzk5QM/TmUC-e9qF5I/AAAAAAAAAQI/iAFLPl52Hwg/s1600-h/317201_10150297433683886_25478884388.jpg"&gt;&lt;img alt="317201_10150297433683886_254788843885_7822180_1515745_n" border="0" height="184" src="http://lh5.ggpht.com/-OELDJGLd724/TmUC-jBJa0I/AAAAAAAAAQM/AHTo9EBetuw/317201_10150297433683886_25478884388%25255B1%25255D.jpg?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="317201_10150297433683886_254788843885_7822180_1515745_n" width="244" /&gt;&lt;/a&gt;   &lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
There were a few presentations that I found especially interesting, including a plenary presentation by &lt;a href="http://www.imtt.com.ar/2011conference/front/index.asp?ID=39&amp;amp;Lang=En#Suzanne_de_Santamarina"&gt;Suzanne de Santamarina&lt;/a&gt; on the use of quality metrics. You can see some of &lt;a href="http://friendfeed.com/search?q=imtt7&amp;amp;from=kvroy"&gt;the twitter trail here&lt;/a&gt; and &lt;a href="http://www.scribd.com/doc/63215305/IMTT-Conference-%E2%80%93-Twitter-feed"&gt;here&lt;/a&gt; but basically Suzanne described her very active use of &lt;a href="http://www.l10nworks.com/forum/default.aspx?g=posts&amp;amp;t=93"&gt;J2450&lt;/a&gt; measurements to improve the dialogue on quality with customers and with her translators. While there clearly is effort and expense involved in implementing this as actively as she has, I think it dramatically improves the conversation regarding translation quality between all the participants, as it is very specific and impersonal and clear about what quality means.&amp;nbsp; It is also a means to build what she called “customer delight” which of course also includes a major service component. &lt;/div&gt;
&lt;blockquote style="color: #4c1130; font-family: Verdana,sans-serif;"&gt;
&lt;div align="right"&gt;
Quality in a product or service is not what the supplier puts in. &lt;b&gt;It is what the customer gets out (of the product/service) and is willing to pay for&lt;/b&gt;. A product is not quality because it is hard to make and costs a lot of money, as manufacturers typically believe. This is incompetence. Customers pay only for what is of use to them and gives them value. Nothing else constitutes quality…         &lt;br /&gt;
~ Peter Drucker&lt;/div&gt;
&lt;/blockquote&gt;
&lt;a href="http://lh6.ggpht.com/-UUWqj6Lxifo/TmUC_AtI9VI/AAAAAAAAAQQ/Q457N9snKqo/s1600-h/j24502.jpg"&gt;&lt;img alt="j2450" border="0" height="244" src="http://lh5.ggpht.com/-rkCXyTdBWJ4/TmUC_Uk6ymI/AAAAAAAAAQU/pgMyJnmWP6s/j2450_thumb.jpg?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="j2450" width="194" /&gt;&lt;/a&gt; &lt;br /&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;Asia Online makes a software tool available to enable customers to calculate J2450 scores for this very reason.&amp;nbsp; It helps to move the discussion from inactionable complaints like “I don’t like the quality” or “the quality is not good”,&amp;nbsp; to practical error identification and resolution action steps like&amp;nbsp; “Is there a way to reduce frequency of the wrong terminology errors in the system?” Just as proper use of BLEU scores requires care and some expertise so does the use of J2450. Suzanne’s company’s regular and highly structured use of J2450 is such that they can really assess the linguistic quality from project to project with a precision that&amp;nbsp; few have. Her approach is refreshing in its clarity and precision and quite a contrast form the meandering inconclusive discussions on “quality” that you see in LinkedIn. &lt;/span&gt;&lt;b&gt;&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;Tools like BLEU and J2450 depend on the skill level of the user, and require an investment of time and effort and repeated use to develop real user competence before one understands the informational insights that their use can provide&lt;/span&gt;.&lt;/b&gt;&lt;br /&gt;
&lt;a href="http://lh6.ggpht.com/-3yF-Pon0dDM/TmUC_6K5XII/AAAAAAAAAQY/Gu3PKr-kBfM/s1600-h/HumanQualityAssessment2.png"&gt;&lt;img alt="Human Quality Assessment" border="0" height="174" src="http://lh5.ggpht.com/-Zc9tR3k7h6I/TmUDAQ-uB9I/AAAAAAAAAQc/JODA6X7IunE/HumanQualityAssessment_thumb.png?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="Human Quality Assessment" width="244" /&gt;&lt;/a&gt;   &lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I also enjoyed the presentations by master translators like &lt;a href="http://www.imtt.com.ar/2011conference/front/index.asp?ID=39&amp;amp;Lang=En#Joao_Roque_Dias"&gt;João Roque Dias&lt;/a&gt; and &lt;a href="http://www.imtt.com.ar/2011conference/front/index.asp?ID=39&amp;amp;Lang=En#Danilo_Nogueira"&gt;Danilo Nogueira&lt;/a&gt;&amp;nbsp; on the craft and art of translation, and enjoyed talking to them about MT and the life of the translator in general. &lt;i&gt;(Yes, MT is sometimes useful even for some of them.) &lt;/i&gt;There were several skill focused presentations on Language QA tools, CAT and collaborative tools that were also very interesting. I heard great things about &lt;a href="http://www.imtt.com.ar/2011conference/front/index.asp?ID=39&amp;amp;Lang=En#Val_Ivonica"&gt;Val Ivonica&lt;/a&gt;’s presentation &lt;i&gt;(in Brazilian&lt;/i&gt;) on translation productivity tools which I was unable to attend as it coincided with mine. It is interesting that &lt;a href="http://www.imtt.com.ar/2011conference/front/index.asp?ID=39&amp;amp;Lang=En#Patricia_Brown"&gt;Patricia Bown&lt;/a&gt; positioned MemoQ as collaboration software that enables the linear &lt;a href="http://www.dqglossary.com/simple/thoughtData/4010.html"&gt;TEP&lt;/a&gt; model to evolve, enabling faster turnaround and higher volume. There were many Brazilians present &lt;i&gt;(though some said not enough)&lt;/i&gt; and they lived up to their reputation for revelry but unfortunately were thwarted in their &lt;i&gt;(our)&lt;/i&gt; attempts to find a karaoke place one evening. Nevertheless they shared their linguistically oriented humor with me and I had no difficulty finding a willing interpreter even though I was often the only person who did not speak the language.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I delivered a presentation on the emerging role of MT as a means to deal with the translation challenges created by the content explosion and new kinds of dynamic product/business related content. The feedback I received was mostly positive and constructive even though there were several very skeptical translators in the crowd. There were some in the audience who have already experienced MT that works and even those who had not worked with customized systems admitted that sometimes MT was useful.&amp;nbsp; I was also on a panel on &lt;b&gt;“The Future of the Industry”&lt;/b&gt; which got mixed reviews as some translators felt it was not relevant and others felt it was a tired topic that nobody had any real clarity on. Many feel change is coming but are not clear what this really means and unfortunately for many the end-result of these changes is that customers expect more work for less money. This does mean that there is a certain amount of apprehension amongst the attendees as the future is not quite predictable.&lt;/div&gt;
&lt;a href="http://lh4.ggpht.com/-hyvNAcGfcsE/TmUDAr4EdBI/AAAAAAAAAQg/bs8qOOYhCDo/s1600-h/313481_10150297437053886_25478884388%25255B1%25255D.jpg"&gt;&lt;img alt="313481_10150297437053886_254788843885_7822203_7110892_n" border="0" height="184" src="http://lh5.ggpht.com/-t5XKxFViIN4/TmUDBHdj73I/AAAAAAAAAQk/0-4SotBgixQ/313481_10150297437053886_25478884388.jpg?imgmax=800" style="border-bottom-width: 0px; border-left-width: 0px; border-right-width: 0px; border-top-width: 0px; display: block; float: none; margin-left: auto; margin-right: auto;" title="313481_10150297437053886_254788843885_7822203_7110892_n" width="244" /&gt;&lt;/a&gt; &lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
A &lt;a href="http://winandwinnow.com/blog/?p=593"&gt;blog entry by Emily Stewart&lt;/a&gt; that pondered upon the theme of technology driven change at the conference a few days later, triggered &lt;a href="http://lnkd.in/ni_pTk"&gt;an interesting and on-going discussion&lt;/a&gt; in LinkedIn.&amp;nbsp; Her post which was about the advent of technology in a variety of different markets is thoughtful and worth reading. I also think her conclusion &lt;i&gt;(shown below)&lt;/i&gt; is good advice for us all.&lt;/div&gt;
&lt;blockquote style="color: purple; font-family: Verdana,sans-serif;"&gt;
Instead of denouncing &lt;a href="http://research.microsoft.com/en-us/projects/mt/"&gt;machine translation&lt;/a&gt; as the end of the translation world as we know it, it may be time to take a step back and see what happens.&amp;nbsp; The discussion shouldn’t stop, but perhaps it could become less polemic and instead convert into a deeper conversation on and reflection of what may or may not lie ahead.&lt;/blockquote&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
While initially there is a lot of focus on the perceived threat &lt;i&gt;(there are some who think that I, together with other over zealous MT developers, am responsible for some of this fear and FUD&lt;/i&gt;), I am hoping that the dialogue moves beyond this point. Some MT systems have indeed been used to push rates down unfairly, but as we all begin to better understand these early mishaps, this can and must change. As &lt;a href="http://www.youtube.com/watch?v=eKgPY1adc0A"&gt;George W Bush misspoke&lt;/a&gt; when he tried to say "Fool me once, shame on you; Fool me twice, shame on me."&amp;nbsp; &lt;i&gt;(I hope you click on the Bush video, it is toooo funny).&lt;/i&gt; If it becomes clearer to everybody what it actually takes to “finish off” MT output to required target quality levels, this kind of abuse cannot continue. &lt;a href="http://kv-emptypages.blogspot.com/2011/02/exploration-of-post-editing-mt-part-i.html"&gt;We need better quality assessment so that this gap can be more clearly defined&lt;/a&gt;.&lt;br /&gt;
&lt;br /&gt;
All MT systems are not equal and to have a global post-editing pricing policy is guaranteed to create disenchantment. We all need to better understand where to use MT and where to avoid it. MT cannot easily if ever replace humans, on the same projects that were previously done through a careful human TEP process. If the quality expectations are high, it has to be MT and human.&amp;nbsp; MT makes most sense where there is ongoing volume and information volatility. We also need to better understand how to quickly assess the output quality of different MT systems so that post-editors are compensated fairly. The best MT systems are yet to come and they will be better because they are the product of informed linguistic steering in addition to standard data and MT techniques. We have yet to see useful compensation systems develop for these linguists and this will probably be needed before some of the uneasiness dissipates, but the forces driving this expanding need are strong and hopefully we should realize and recognize the value of these key individuals at some point in the future. This is already true at Asia Online so I imagine it can be done elsewhere.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
In terms of disintermediation, I think MT will be only part of the whole picture, as we see more people learn to use motivated communities to get work done. &lt;a href="http://www.globalbydesign.com/blog/2010/05/10/adobe-translation-crowdsourcing-china/"&gt;Adobe&lt;/a&gt; and others have learnt to use “the crowd” to get traditional localization work done using translation platforms like &lt;a href="http://www.lingotek.com/content/lingotek-deliver-more-localized-community-translation-adobe"&gt;Lingotek&lt;/a&gt; and newcomer &lt;a href="http://www.examiner.com/tech-industry-in-new-york/interview-with-jack-welde-ceo-of-smartling-video"&gt;Smartling&lt;/a&gt; (&lt;i&gt;which might also have obtained the biggest startup investment made by a VC in the translation industry&lt;/i&gt;.) Much of the coming change will also come from collaboration software platforms like Lingotek, Smartling and &lt;a href="http://www.businesscloud9.com/content/cloudwords-translates-action/6326#.TmUAbe5ybdM.twitter"&gt;others&lt;/a&gt; yet to come, that change how translation projects get done in terms of process flow, and that have a different modus operandi from traditional localization tools born in the TEP world. &lt;b&gt;Translators are required to spend too much time working with data in different formats and too little time on the actual act of translation. New collaboration platforms and real data interchange standards will hopefully enable translators to focus mostly on real linguistic problem solving, and not on &lt;a href="http://www.translationtribulations.com/2011/08/format-surcharging-in-translation.html"&gt;managing archaic and arcane format interchange&lt;/a&gt; issues.&amp;nbsp;&lt;/b&gt; &lt;/div&gt;
&lt;br /&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
From my vantage point, I see that -    &lt;br /&gt;
1) &lt;b&gt;Translation is increasingly done outside of the sphere of the localization world&lt;/b&gt; and community based translation initiatives around the world are gathering momentum both in the non-profit and corporate world     &lt;br /&gt;
2) &lt;b&gt;The volume of translation that can help drive international business initiatives forward is increasing at a substantial rate &lt;/b&gt;(5X to perhaps as much as 100X) Interestingly, there are still some who think that this content explosion is a myth.    &lt;br /&gt;
3) &lt;b&gt;Social network conversations matter and are often more important to translate than having user documentation that is "perfect" and “error-free”.&lt;/b&gt; The company to customer communications have also become much more interactive, real-time and urgent and go way beyond the scope of most user documentation.&amp;nbsp;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
Thus to approach every translation task with the TEP mindset that made great sense in the 1X or 2X volume days is not useful today. New approaches are needed and new models of automation/collaboration are necessary - and are perhaps the only way that all the changing momentum can be handled effectively. MT is simply one part of the equation and is far from being the whole solution. &lt;b&gt;The need to solve this overall translation challenge is linked to the customers business survival so it gains a kind of momentum of inevitability.&lt;/b&gt; Businesses need to translate way more content to remain competitive in global marketplaces that move at internet speeds, thus automation and better collaboration are essential and critical to success and even survival.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&amp;nbsp; &lt;br /&gt;
We have seen in the last 5 years that many of the largest global organizations have launched MT initiatives on their own, because their LSP vendors were/are stuck in the TEP mindset, and did not realize that their customers had to learn to do dramatically more translation with not very much more money. &lt;b&gt;This is perhaps a clue that in certain volume and time constraint scenarios, MT is necessary. We have seen that global enterprises need to solve this problem with or without vendors who historically managed the bulk of their localization translation.&lt;/b&gt; My sense is that this trend is likely to build momentum if LSPs do not learn to offer real MT competence. Real MT competence comes from building custom systems and seeing what works and what does not. Global enterprises will increasingly take this task upon themselves if they cannot find LSPs who can help them solve this problem e.g. TAUS is mostly a buyer driven organization with the key focus of sharing TM and facilitating large scale MT initiatives. The greatest successes presented at TAUS are all in-house initiatives with little LSP involvement. Surely this is because there is a real need, and we see that competitors are willing to share linguistic data and resources to handle this problem.&lt;b&gt; I suspect that the buyer’s motivation is less about saving cents per word on translation costs, and much more about keeping and building customer loyalty and satisfaction in a world with growing global online commerce and information access needs.&lt;/b&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;
My guess is that some of the anxiety on the coming change comes not so much from raw technology like MT, but perhaps it's real origin is the growing awareness that some of the work they are involved with grows less valuable to the &lt;b&gt;customer’s real mission: which is to build and develop international markets.&lt;/b&gt; Perhaps the anxiety is really rooted in the fact that they sense that they are not involved in high value work. &lt;b&gt;The real threat is not MT per se, but it is the growing awareness amongst international marketing executives (in global enterprises) that they need to focus on what their customers really care about - &lt;u&gt;more and more often this is something other than getting a really great user manual out.&lt;/u&gt;&lt;/b&gt; Have you noticed that many leading edge companies like Apple, Sony have dramatically reduced their investment in user manuals? The iPhone simply does not have one (in the box but they do on the web). I am not suggesting that manuals are going away, but it is already clear that their relative value is diminishing. The content that drives global customer adoption and loyalty is changing and thus the relative value of traditional localization (software and documentation) work also changes.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
I expect that new translation production models to build success in international markets will involve MT (and other translation automation), crowdsourcing as well as professional oversight and management. &lt;b&gt;It is very likely that old production models like TEP will be increasingly less important, or just one of several approaches to translation projects as new collaboration models gain momentum&lt;/b&gt;.I think that the most successful approaches to solving these "new" translation problems&amp;nbsp; will involve a close and constructive collaboration between traditional localization professionals, linguists, MT developers, end-customers and probably others in global enterprise organizations who have never worked in "localization" but are more directly concerned about the quality of the relationship with the final customer across the world. &lt;b&gt;At the end of the day our value as an industry is determined by how useful our input is to the process of building international markets and the requirements for success are changing as we speak.&lt;/b&gt;   &lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
The conversations at IMTT and the ensuing discussions suggest that while progress is being made in the understanding of translation technology, there is still a long way to go. I hope that at future IMTT conferences we see more discussion of approaches to translation projects where TEP may not make sense and automation and collaboration approaches can help solve different kinds of problems that also further international business initiatives. I expect that IMTT will be a leader in changing the current polemic and also expand the conversation to new stakeholders. This conversation is likely to require much more direct content with product management, international sales and support teams and the final end customer. Hopefully some of us in the industry get to lead or participate in&amp;nbsp; the driving this change through these new conversations.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
While change can be difficult it can also be a time of opportunity and a time when leadership changes. Very few try to understand the forces of change better. &lt;a href="http://www.resiliencycenter.com/bkstore/ResAdv-chap1.shtml" target="_blank"&gt;People often go through a sequential emotional cycle&lt;/a&gt; before they learn to cope, and eventually even thrive when facing disruptive change. Those who get stuck at fear and despair, often end up as victims.&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
This little video shows that effective and heartfelt communication across cultures need not be heavily planned, ponderous or calculated. Sometimes simple and real is enough to create the change and build a connection to your customers.&lt;/div&gt;
&lt;br /&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;iframe frameborder="0" height="225" src="http://player.vimeo.com/video/1211060?title=0&amp;amp;byline=0&amp;amp;portrait=0" width="400"&gt;&lt;/iframe&gt;&lt;/div&gt;
&lt;a href="http://vimeo.com/1211060"&gt;Where the Hell is Matt? (2008)&lt;/a&gt; from &lt;a href="http://vimeo.com/user484313"&gt;Matthew Harding&lt;/a&gt; on &lt;a href="http://vimeo.com/"&gt;Vimeo&lt;/a&gt;.&lt;br /&gt;
&lt;br /&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-12580934454006820?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/ewlt_8Neq2T-u7WITmYkq3P3tDA/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/ewlt_8Neq2T-u7WITmYkq3P3tDA/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/ewlt_8Neq2T-u7WITmYkq3P3tDA/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/ewlt_8Neq2T-u7WITmYkq3P3tDA/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=pPZNY3eK3Sc:Dh7FgArYh7Q:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=pPZNY3eK3Sc:Dh7FgArYh7Q:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=pPZNY3eK3Sc:Dh7FgArYh7Q:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=pPZNY3eK3Sc:Dh7FgArYh7Q:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/pPZNY3eK3Sc" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/12580934454006820/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/09/continuing-saga-evolution-of-machine.html#comment-form" title="15 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/12580934454006820?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/12580934454006820?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/pPZNY3eK3Sc/continuing-saga-evolution-of-machine.html" title="The Continuing Saga &amp;amp; Evolution of Machine Translation" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://lh5.ggpht.com/-OELDJGLd724/TmUC-jBJa0I/AAAAAAAAAQM/AHTo9EBetuw/s72-c/317201_10150297433683886_25478884388%25255B1%25255D.jpg?imgmax=800" height="72" width="72" /><thr:total>15</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/09/continuing-saga-evolution-of-machine.html</feedburner:origLink></entry><entry gd:etag="W/&quot;AkQMSXY_eip7ImA9WhRVFEU.&quot;"><id>tag:blogger.com,1999:blog-6748877443699290050.post-6564386157674830296</id><published>2011-08-01T12:59:00.000-07:00</published><updated>2012-01-13T12:59:48.842-08:00</updated><app:edited xmlns:app="http://www.w3.org/2007/app">2012-01-13T12:59:48.842-08:00</app:edited><category scheme="http://www.blogger.com/atom/ns#" term="crowdsourcing" /><category scheme="http://www.blogger.com/atom/ns#" term="localization" /><title>Translation Crowdsourcing</title><content type="html">&lt;div dir="ltr" style="text-align: left;" trbidi="on"&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;The phenomena of a crowd (or community) stepping forward and
doing real translation work, often for no&amp;nbsp;direct financial compensation is
something that troubles many in the professional translation world.&amp;nbsp;Mostly
because they see this activity, as work being taken away from legitimate
professionals or they see it as a ploy to reduce prices. While in some cases
their fears may actually be justified, in the most successful uses of this
approach&amp;nbsp;I think it is clear that this is not true.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;As I have said before, the &lt;/span&gt;&lt;a href="http://kv-emptypages.blogspot.com/2010/04/data-deluge-and-growing-need-for.html"&gt;&lt;b&gt;growing momentum in the volume of
content&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt; demands &lt;/span&gt;&lt;a href="http://kv-emptypages.blogspot.com/2010/01/why-machine-translation-matters-for.html"&gt;&lt;b&gt;new production models&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt;. This momentum
which exists both in the corporate world and also the &lt;/span&gt;&lt;span style="color: #204063;"&gt;general &lt;/span&gt;&lt;span style="color: #204063;"&gt;world out there simply
cannot be addressed by ONLY using traditional professional translation
production models. New needs require new approaches. For those who insist that the data deluge is a fiction, the rest of this post is probably irrelevant.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;Another key driving force behind new crowdsourcing initiatives
is the need to engage and interact with users in new markets. In new markets
having active conversations with locals is key to building brand awareness and
really learning about local needs and behavior. This is frequently a more
important driver than cost containment as many in the industry think.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;In some cases were it not for crowd-based localization efforts,
it would simply not be done as it is not economically feasible to undertake the
same efforts (and expenses) as are made for FIGS/CJK for “lesser” languages.
Thus crowdsourcing is emerging sometimes as a means to get “lesser” languages
done.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;If we look at some of the most successful examples of
crowd-sourced translation in practice, we can see that they have many if not all
of the following elements in common.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;&lt;span style="color: #204063; font-size: 12pt;"&gt;A Crowd/Community
That Is Invested:&lt;/span&gt;&lt;/b&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://4.bp.blogspot.com/-cV97LzbxggI/TjcydLX3waI/AAAAAAAAAP8/B3wVHPsnW2E/s1600/TED+Languages.jpg" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" height="221" src="http://4.bp.blogspot.com/-cV97LzbxggI/TjcydLX3waI/AAAAAAAAAP8/B3wVHPsnW2E/s320/TED+Languages.jpg" width="320" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;/div&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraph" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
·&lt;span style="-moz-font-feature-settings: normal; -moz-font-language-override: normal; font-size-adjust: none; font-size: 7pt; font-stretch: normal; font-style: normal; font-variant: normal; font-weight: normal; line-height: normal;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;
&lt;/span&gt;&lt;b&gt;&lt;a href="http://www.ted.com/OpenTranslationProject"&gt;TED Open Translation Project&amp;nbsp;&lt;/a&gt;&lt;/b&gt;&lt;span style="color: #204063;"&gt;– Volunteer
translators are often inspired&amp;nbsp;by the&amp;nbsp;content and wish to share it
with their&amp;nbsp;friends and countrymen.&amp;nbsp;June Cohen has said that &lt;/span&gt;&lt;a href="http://www.ted.com/pages/view/id/290"&gt;&lt;b&gt;the
volunteer translators&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt; in general do better quality work than the many of the paid
professionals, who initially did a few translations to seed the project because
of their passion for the subject and often their subject matter expertise. This effort has now enabled over 20,000
translations into 80+ languages of really challenging material. Many
professionals also volunteer because they believe in the high general value of the
content.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoListParagraph" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://1.bp.blogspot.com/-NhSHpF303G8/Tjb5oRZWR6I/AAAAAAAAAPw/-HAljT2fObw/s1600/TED+Volunteers.jpg" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" height="206" src="http://1.bp.blogspot.com/-NhSHpF303G8/Tjb5oRZWR6I/AAAAAAAAAPw/-HAljT2fObw/s320/TED+Volunteers.jpg" width="320" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;/div&gt;
&lt;div class="MsoListParagraph" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraph" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;span style="color: #204063;"&gt; &lt;/span&gt;&lt;/div&gt;
&lt;div align="center" class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-align: center;"&gt;
&lt;span style="color: #204063;"&gt;&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpFirst" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
·&lt;span style="-moz-font-feature-settings: normal; -moz-font-language-override: normal; font-size-adjust: none; font-size: 7pt; font-stretch: normal; font-style: normal; font-variant: normal; font-weight: normal; line-height: normal;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;
&lt;/span&gt;&lt;a href="http://techcrunch.com/2008/02/07/facebook-turns-1500-users-into-spanish-translation-slaves/"&gt;&lt;b&gt;Facebook&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt;&amp;nbsp;– Users who
wish to build and expand the friend community in their particular language
group. This effort has enabled Facebook to grow rapidly in international
markets and accomplish very rapid coverage across 60+ languages. Had they used
traditional means to do this it may have taken them years to get to the same
point. Critics also often miss the point that engaging real users in the
translation task also encourages rapid growth of the user base as “user
translators” engage friends into their network.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpFirst" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpMiddle" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
·&lt;span style="-moz-font-feature-settings: normal; -moz-font-language-override: normal; font-size-adjust: none; font-size: 7pt; font-stretch: normal; font-style: normal; font-variant: normal; font-weight: normal; line-height: normal;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;
&lt;/span&gt;&lt;a href="http://support.microsoft.com/"&gt;&lt;b&gt;Microsoft&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt; - MVPs (top
accredited reseller partners) who wish to make technical support knowledge
about&amp;nbsp;Microsoft products more easily and widely available in their
markets. Their efforts are rewarded by lower support costs and also an increase
in product sales as more and more users look for self-service knowledge base
information. Microsoft has been a trail blazer in making large amounts of knowledge base content available via MT, they are now adding crowd based editing to raise the quality of the translated information. Thus the most used and vital information tends to get the most attention and benefits all users. &lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpMiddle" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpLast" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
·&lt;span style="-moz-font-feature-settings: normal; -moz-font-language-override: normal; font-size-adjust: none; font-size: 7pt; font-stretch: normal; font-style: normal; font-variant: normal; font-weight: normal; line-height: normal;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;
&lt;/span&gt;&lt;a href="http://www.asiaonline.net/portal.aspx"&gt;&lt;b&gt;Asia Online&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt;&amp;nbsp;– Student
users provide corrective feedback to continue to improve the&amp;nbsp;translation
quality of the&amp;nbsp;Wikipedia and other knowledge content that is
initially&amp;nbsp;done by&amp;nbsp;highly&amp;nbsp;customized MT engines and paid
translators. The students themselves will be the primary beneficiaries of this
content, and their efforts will enable them to access high quality educational
information. The volume of this information will likely increase a thousand
fold.&lt;/span&gt;&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://3.bp.blogspot.com/-6jYzBQHoXzI/Tjb59JUl2ZI/AAAAAAAAAP0/Eq4w18_OX-A/s1600/AsiaOnline+Call.jpg" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" height="173" src="http://3.bp.blogspot.com/-6jYzBQHoXzI/Tjb59JUl2ZI/AAAAAAAAAP0/Eq4w18_OX-A/s320/AsiaOnline+Call.jpg" width="320" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpLast" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpFirst" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&amp;nbsp;·&lt;span style="-moz-font-feature-settings: normal; -moz-font-language-override: normal; font-size-adjust: none; font-size: 7pt; font-stretch: normal; font-style: normal; font-variant: normal; font-weight: normal; line-height: normal;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;
&lt;/span&gt;&lt;a href="http://www.niemanlab.org/2010/06/the-wikipedia-of-news-translation-yeeyan-orgs-volunteer-community/"&gt;&lt;b&gt;Yeeyan:&amp;nbsp;&lt;/b&gt;&lt;/a&gt;&lt;span style="color: #204063;"&gt; &lt;/span&gt;has 150,000 registered 
users, who collectively translate 50 to 100 news articles every day from
 English to Chinese. Since its inception in 2006, the site has grown 
into a key gateway for Chinese speakers who want to follow international
 news. It has been so successful that it has attracted the attention of 
major news sources like &lt;a href="http://www.guardian.co.uk/world/2009/dec/03/yeeyan-china-guardian-media-mandarin"&gt;The Guardian&lt;/a&gt; and ReadWriteWeb. Yeeyan is focused on addressing the &lt;a href="http://www.niemanlab.org/2010/06/the-wikipedia-of-news-translation-yeeyan-orgs-volunteer-community/"&gt;problem of ghettoization of information by language&lt;/a&gt; through a community collaboration, where members both identify interesting content and also help to translate this content.&lt;br /&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://3.bp.blogspot.com/-dX_7wmZEMFg/Tjcy8dueTtI/AAAAAAAAAQA/-VpuRmb94lA/s1600/Yeeyanlogo.png" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" src="http://3.bp.blogspot.com/-dX_7wmZEMFg/Tjcy8dueTtI/AAAAAAAAAQA/-VpuRmb94lA/s1600/Yeeyanlogo.png" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;div class="separator" style="clear: both; text-align: center;"&gt;
&lt;a href="http://3.bp.blogspot.com/-i5DZsjv56NA/TjczGdun3NI/AAAAAAAAAQE/cSoWCXao_lE/s1600/yeeyanparalleltext.png" imageanchor="1" style="margin-left: 1em; margin-right: 1em;"&gt;&lt;img border="0" height="309" src="http://3.bp.blogspot.com/-i5DZsjv56NA/TjczGdun3NI/AAAAAAAAAQE/cSoWCXao_lE/s320/yeeyanparalleltext.png" width="320" /&gt;&lt;/a&gt;&lt;/div&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpFirst" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpMiddle" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif; text-indent: -0.25in;"&gt;
·&lt;span style="-moz-font-feature-settings: normal; -moz-font-language-override: normal; font-size-adjust: none; font-size: 7pt; font-stretch: normal; font-style: normal; font-variant: normal; font-weight: normal; line-height: normal;"&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;
&lt;/span&gt;&lt;span style="color: #204063;"&gt;&lt;a href="http://www.globalbydesign.com/blog/2010/05/10/adobe-translation-crowdsourcing-china/"&gt;&lt;b&gt;Adobe&lt;/b&gt;&lt;/a&gt;:
This is a much more carefully managed effort designed to engage influential
users, partners and customers to help provide relevant information for the
broad Adobe User community in China.&lt;/span&gt;&lt;br /&gt;
&lt;br /&gt;
&lt;span style="color: #204063;"&gt;T&amp;nbsp;&amp;nbsp;&amp;nbsp;&lt;b&gt;&lt;a href="http://translate.twttr.com/welcome"&gt;Twitter:&lt;/a&gt;&lt;/b&gt; &lt;/span&gt;The translation center asks Twitter users -- all volunteers -- to 
help translate Twitter's interface into various languages.  Once the 
basic support pages are translated, a select group of the "most active" 
translators are invited to work with Twitter to "maintain localized 
versions of the service." Twitter boasts that its translation center has 200,000 translators,
 and that the localization process for Dutch and Indonesian took just 
one month from the first call for involvement to its announcement. The availability of its interface in multiple foreign languages is bound
 to increase its popularity and effectiveness not only for online 
marketing but also for social and political activism.&lt;/div&gt;
&lt;div class="MsoListParagraphCxSpLast" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;&lt;span style="color: #204063; font-size: 12pt;"&gt;Software
Infrastructure That Facilitates Contribution &amp;amp; Participation:&lt;/span&gt;&lt;/b&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;In all of the cases above the companies involved crowdsourced
translation initiatives need to invest in software that enables tasks to be
parceled out, evolve as tasks change, enable efficient administration, maintain
quality, gather feedback, and build self-sustaining eco-systems. The tools
developed by dotSUB, Lingotek, Yeeyan&amp;nbsp;and Asia Online are all unique
collaboration and translation workflow management tools that enable these kinds
of initiatives, They make little or no use of industry standard tools like
Trados and TMS because of the highly proprietary, rigidity and archaic nature
of these tools. These new-generation tools are much more open and are designed
to evolve with technical and process advances on the internet today. It is quite possible that these community efforts could produce tools that supercede many of the tools in use today as these new tools focus on collaboration and sharing assets to enhance the efficiency of the collaborative translation process.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;b&gt;&lt;span style="color: #204063; font-size: 12pt;"&gt;The Importance of
Engagement and Higher Purpose&lt;/span&gt;&lt;/b&gt;&lt;span style="color: #204063; font-size: 12pt;"&gt;:&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;It is interesting to note that translation is not the primary
business of any of the companies listed in the examples above. In every case
the goal and intent is &lt;b&gt;to
make more information available faster&lt;/b&gt;. Even for many of the
corporations that are exploring crowdsourcing, the rationale is often more about
customer engagement than cost savings. &lt;b&gt;It
is also important to note that none of these&amp;nbsp;initiatives could even be attempted
without the use of automation and&amp;nbsp;large-scale community support and they
are enabling initiatives that would not be possible otherwise.&lt;/b&gt;
This is also true for Facebook who still had to use professionals to translate
legalese that their community was not interested in translating. &amp;nbsp;The role
of communities is likely to increase in future as more of the world comes
online.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;As we move forward we will see much more video and other rich content come online and
already it is clear that the old approaches will not enable us to make this new
content multilingual in an effective time frame. Crowdsourcing and automated
translation will be necessary tools for an organization that seeks to communicate
across the globe. As Clay Shirky has pointed out, the ‘cognitive surplus’ of
the online population is a force that can be harnessed under the right
circumstances and for the right purposes. It is likely that the professional
translation world is going to see significant disruption in the coming years,
as innovators figure out how to build sustainable models around community
engagement, technology and organizational mission. However, as we have already seen, there is much that the crowd has no interest in doing and we should expect that this is not likely to change.&lt;/span&gt;&lt;/div&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;br /&gt;&lt;/div&gt;
&lt;span style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;

&lt;/span&gt;&lt;br /&gt;
&lt;div class="MsoNormal" style="font-family: &amp;quot;Trebuchet MS&amp;quot;,sans-serif;"&gt;
&lt;span style="color: #204063;"&gt;Crowdsourcing is here to stay and is a new mode of production
that enables high–volume projects to be undertaken, engage with users and
partners more deeply and participate in multilingual social networks where so
many branding impressions are being formed. Managing crowdsourcing is also a
major opportunity for savvy LSPs who have processes in place to recruit and
manage the collaboration of dispersed volunteers and contributors.&lt;/span&gt;&lt;/div&gt;
&lt;/div&gt;&lt;div class="blogger-post-footer"&gt;&lt;img width='1' height='1' src='https://blogger.googleusercontent.com/tracker/6748877443699290050-6564386157674830296?l=kv-emptypages.blogspot.com' alt='' /&gt;&lt;/div&gt;
&lt;p&gt;&lt;a href="http://feedads.g.doubleclick.net/~a/M_f3g2R5_Fokt-w_Y91VqOxKAsQ/0/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/M_f3g2R5_Fokt-w_Y91VqOxKAsQ/0/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;br/&gt;
&lt;a href="http://feedads.g.doubleclick.net/~a/M_f3g2R5_Fokt-w_Y91VqOxKAsQ/1/da"&gt;&lt;img src="http://feedads.g.doubleclick.net/~a/M_f3g2R5_Fokt-w_Y91VqOxKAsQ/1/di" border="0" ismap="true"&gt;&lt;/img&gt;&lt;/a&gt;&lt;/p&gt;&lt;div class="feedflare"&gt;
&lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=FraJrdgQpXM:Ipw497g7WvU:yIl2AUoC8zA"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=yIl2AUoC8zA" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=FraJrdgQpXM:Ipw497g7WvU:F7zBnMyn0Lo"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?i=FraJrdgQpXM:Ipw497g7WvU:F7zBnMyn0Lo" border="0"&gt;&lt;/img&gt;&lt;/a&gt; &lt;a href="http://feeds.feedburner.com/~ff/EmptyPages?a=FraJrdgQpXM:Ipw497g7WvU:qj6IDK7rITs"&gt;&lt;img src="http://feeds.feedburner.com/~ff/EmptyPages?d=qj6IDK7rITs" border="0"&gt;&lt;/img&gt;&lt;/a&gt;
&lt;/div&gt;&lt;img src="http://feeds.feedburner.com/~r/EmptyPages/~4/FraJrdgQpXM" height="1" width="1"/&gt;</content><link rel="replies" type="application/atom+xml" href="http://kv-emptypages.blogspot.com/feeds/6564386157674830296/comments/default" title="Post Comments" /><link rel="replies" type="text/html" href="http://kv-emptypages.blogspot.com/2011/08/translation-crowdsourcing.html#comment-form" title="2 Comments" /><link rel="edit" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/6564386157674830296?v=2" /><link rel="self" type="application/atom+xml" href="http://www.blogger.com/feeds/6748877443699290050/posts/default/6564386157674830296?v=2" /><link rel="alternate" type="text/html" href="http://feedproxy.google.com/~r/EmptyPages/~3/FraJrdgQpXM/translation-crowdsourcing.html" title="Translation Crowdsourcing" /><author><name>Kirti Vashee</name><uri>http://www.blogger.com/profile/16795076802721564830</uri><email>noreply@blogger.com</email><gd:image rel="http://schemas.google.com/g/2005#thumbnail" width="24" height="32" src="http://1.bp.blogspot.com/_PNHg7X3zPiw/S0z-9sDoJKI/AAAAAAAAAAg/kR6cP688M5k/S220/kv_cartoonizer.jpg" /></author><media:thumbnail xmlns:media="http://search.yahoo.com/mrss/" url="http://4.bp.blogspot.com/-cV97LzbxggI/TjcydLX3waI/AAAAAAAAAP8/B3wVHPsnW2E/s72-c/TED+Languages.jpg" height="72" width="72" /><thr:total>2</thr:total><feedburner:origLink>http://kv-emptypages.blogspot.com/2011/08/translation-crowdsourcing.html</feedburner:origLink></entry></feed>

