added mgiza

2017-01-21 17:07:36 +01:00 · 2017-01-21 17:07:36 +01:00 · df5dddc924
commit df5dddc924
parent 6f995a64f2
676 changed files with 212224 additions and 0 deletions
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.cproject
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.cproject
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.cvsignore
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.cvsignore
@@ -0,0 +1,37 @@
+.anjuta
+.tm_project*
+.libs
+.deps
+.*swp
+.nautilus-metafile.xml
+*.autosave
+*.pws
+*.bak
+*~
+#*#
+*.gladep
+*.la
+*.lo
+*.o
+*.class
+*.pyc
+aclocal.m4
+autom4te.cache
+config.h
+config.h.in
+config.log
+config.status
+configure
+intltool-extract*
+intltool-merge*
+intltool-modules*
+intltool-update*
+libtool
+prepare.sh
+stamp-h*
+ltmain.sh
+mkinstalldirs
+config.guess
+config.sub
+Makefile
+Makefile.in
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.project
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.project
@@ -0,0 +1,82 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<projectDescription>
+	<name>MGizaWhiteList</name>
+	<comment></comment>
+	<projects>
+	</projects>
+	<buildSpec>
+		<buildCommand>
+			<name>org.eclipse.cdt.managedbuilder.core.genmakebuilder</name>
+			<triggers>clean,full,incremental,</triggers>
+			<arguments>
+				<dictionary>
+					<key>?name?</key>
+					<value></value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.append_environment</key>
+					<value>true</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.autoBuildTarget</key>
+					<value>all</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.buildArguments</key>
+					<value></value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.buildCommand</key>
+					<value>make</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.buildLocation</key>
+					<value>${workspace_loc:/MGizaWhiteList/Debug}</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.cleanBuildTarget</key>
+					<value>clean</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.contents</key>
+					<value>org.eclipse.cdt.make.core.activeConfigSettings</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.enableAutoBuild</key>
+					<value>false</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.enableCleanBuild</key>
+					<value>true</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.enableFullBuild</key>
+					<value>true</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.fullBuildTarget</key>
+					<value>all</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.stopOnError</key>
+					<value>true</value>
+				</dictionary>
+				<dictionary>
+					<key>org.eclipse.cdt.make.core.useDefaultBuildCmd</key>
+					<value>true</value>
+				</dictionary>
+			</arguments>
+		</buildCommand>
+		<buildCommand>
+			<name>org.eclipse.cdt.managedbuilder.core.ScannerConfigBuilder</name>
+			<arguments>
+			</arguments>
+		</buildCommand>
+	</buildSpec>
+	<natures>
+		<nature>org.eclipse.cdt.core.cnature</nature>
+		<nature>org.eclipse.cdt.core.ccnature</nature>
+		<nature>org.eclipse.cdt.managedbuilder.core.managedBuildNature</nature>
+		<nature>org.eclipse.cdt.managedbuilder.core.ScannerConfigNature</nature>
+	</natures>
+</projectDescription>
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.tm_project2.cache
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/.tm_project2.cache
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/AUTHORS
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/AUTHORS
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/COPYING
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/COPYING
@@ -0,0 +1,674 @@
+                    GNU GENERAL PUBLIC LICENSE
+                       Version 3, 29 June 2007
+
+ Copyright (C) 2007 Free Software Foundation, Inc. <http://fsf.org/>
+ Everyone is permitted to copy and distribute verbatim copies
+ of this license document, but changing it is not allowed.
+
+                            Preamble
+
+  The GNU General Public License is a free, copyleft license for
+software and other kinds of works.
+
+  The licenses for most software and other practical works are designed
+to take away your freedom to share and change the works.  By contrast,
+the GNU General Public License is intended to guarantee your freedom to
+share and change all versions of a program--to make sure it remains free
+software for all its users.  We, the Free Software Foundation, use the
+GNU General Public License for most of our software; it applies also to
+any other work released this way by its authors.  You can apply it to
+your programs, too.
+
+  When we speak of free software, we are referring to freedom, not
+price.  Our General Public Licenses are designed to make sure that you
+have the freedom to distribute copies of free software (and charge for
+them if you wish), that you receive source code or can get it if you
+want it, that you can change the software or use pieces of it in new
+free programs, and that you know you can do these things.
+
+  To protect your rights, we need to prevent others from denying you
+these rights or asking you to surrender the rights.  Therefore, you have
+certain responsibilities if you distribute copies of the software, or if
+you modify it: responsibilities to respect the freedom of others.
+
+  For example, if you distribute copies of such a program, whether
+gratis or for a fee, you must pass on to the recipients the same
+freedoms that you received.  You must make sure that they, too, receive
+or can get the source code.  And you must show them these terms so they
+know their rights.
+
+  Developers that use the GNU GPL protect your rights with two steps:
+(1) assert copyright on the software, and (2) offer you this License
+giving you legal permission to copy, distribute and/or modify it.
+
+  For the developers' and authors' protection, the GPL clearly explains
+that there is no warranty for this free software.  For both users' and
+authors' sake, the GPL requires that modified versions be marked as
+changed, so that their problems will not be attributed erroneously to
+authors of previous versions.
+
+  Some devices are designed to deny users access to install or run
+modified versions of the software inside them, although the manufacturer
+can do so.  This is fundamentally incompatible with the aim of
+protecting users' freedom to change the software.  The systematic
+pattern of such abuse occurs in the area of products for individuals to
+use, which is precisely where it is most unacceptable.  Therefore, we
+have designed this version of the GPL to prohibit the practice for those
+products.  If such problems arise substantially in other domains, we
+stand ready to extend this provision to those domains in future versions
+of the GPL, as needed to protect the freedom of users.
+
+  Finally, every program is threatened constantly by software patents.
+States should not allow patents to restrict development and use of
+software on general-purpose computers, but in those that do, we wish to
+avoid the special danger that patents applied to a free program could
+make it effectively proprietary.  To prevent this, the GPL assures that
+patents cannot be used to render the program non-free.
+
+  The precise terms and conditions for copying, distribution and
+modification follow.
+
+                       TERMS AND CONDITIONS
+
+  0. Definitions.
+
+  "This License" refers to version 3 of the GNU General Public License.
+
+  "Copyright" also means copyright-like laws that apply to other kinds of
+works, such as semiconductor masks.
+
+  "The Program" refers to any copyrightable work licensed under this
+License.  Each licensee is addressed as "you".  "Licensees" and
+"recipients" may be individuals or organizations.
+
+  To "modify" a work means to copy from or adapt all or part of the work
+in a fashion requiring copyright permission, other than the making of an
+exact copy.  The resulting work is called a "modified version" of the
+earlier work or a work "based on" the earlier work.
+
+  A "covered work" means either the unmodified Program or a work based
+on the Program.
+
+  To "propagate" a work means to do anything with it that, without
+permission, would make you directly or secondarily liable for
+infringement under applicable copyright law, except executing it on a
+computer or modifying a private copy.  Propagation includes copying,
+distribution (with or without modification), making available to the
+public, and in some countries other activities as well.
+
+  To "convey" a work means any kind of propagation that enables other
+parties to make or receive copies.  Mere interaction with a user through
+a computer network, with no transfer of a copy, is not conveying.
+
+  An interactive user interface displays "Appropriate Legal Notices"
+to the extent that it includes a convenient and prominently visible
+feature that (1) displays an appropriate copyright notice, and (2)
+tells the user that there is no warranty for the work (except to the
+extent that warranties are provided), that licensees may convey the
+work under this License, and how to view a copy of this License.  If
+the interface presents a list of user commands or options, such as a
+menu, a prominent item in the list meets this criterion.
+
+  1. Source Code.
+
+  The "source code" for a work means the preferred form of the work
+for making modifications to it.  "Object code" means any non-source
+form of a work.
+
+  A "Standard Interface" means an interface that either is an official
+standard defined by a recognized standards body, or, in the case of
+interfaces specified for a particular programming language, one that
+is widely used among developers working in that language.
+
+  The "System Libraries" of an executable work include anything, other
+than the work as a whole, that (a) is included in the normal form of
+packaging a Major Component, but which is not part of that Major
+Component, and (b) serves only to enable use of the work with that
+Major Component, or to implement a Standard Interface for which an
+implementation is available to the public in source code form.  A
+"Major Component", in this context, means a major essential component
+(kernel, window system, and so on) of the specific operating system
+(if any) on which the executable work runs, or a compiler used to
+produce the work, or an object code interpreter used to run it.
+
+  The "Corresponding Source" for a work in object code form means all
+the source code needed to generate, install, and (for an executable
+work) run the object code and to modify the work, including scripts to
+control those activities.  However, it does not include the work's
+System Libraries, or general-purpose tools or generally available free
+programs which are used unmodified in performing those activities but
+which are not part of the work.  For example, Corresponding Source
+includes interface definition files associated with source files for
+the work, and the source code for shared libraries and dynamically
+linked subprograms that the work is specifically designed to require,
+such as by intimate data communication or control flow between those
+subprograms and other parts of the work.
+
+  The Corresponding Source need not include anything that users
+can regenerate automatically from other parts of the Corresponding
+Source.
+
+  The Corresponding Source for a work in source code form is that
+same work.
+
+  2. Basic Permissions.
+
+  All rights granted under this License are granted for the term of
+copyright on the Program, and are irrevocable provided the stated
+conditions are met.  This License explicitly affirms your unlimited
+permission to run the unmodified Program.  The output from running a
+covered work is covered by this License only if the output, given its
+content, constitutes a covered work.  This License acknowledges your
+rights of fair use or other equivalent, as provided by copyright law.
+
+  You may make, run and propagate covered works that you do not
+convey, without conditions so long as your license otherwise remains
+in force.  You may convey covered works to others for the sole purpose
+of having them make modifications exclusively for you, or provide you
+with facilities for running those works, provided that you comply with
+the terms of this License in conveying all material for which you do
+not control copyright.  Those thus making or running the covered works
+for you must do so exclusively on your behalf, under your direction
+and control, on terms that prohibit them from making any copies of
+your copyrighted material outside their relationship with you.
+
+  Conveying under any other circumstances is permitted solely under
+the conditions stated below.  Sublicensing is not allowed; section 10
+makes it unnecessary.
+
+  3. Protecting Users' Legal Rights From Anti-Circumvention Law.
+
+  No covered work shall be deemed part of an effective technological
+measure under any applicable law fulfilling obligations under article
+11 of the WIPO copyright treaty adopted on 20 December 1996, or
+similar laws prohibiting or restricting circumvention of such
+measures.
+
+  When you convey a covered work, you waive any legal power to forbid
+circumvention of technological measures to the extent such circumvention
+is effected by exercising rights under this License with respect to
+the covered work, and you disclaim any intention to limit operation or
+modification of the work as a means of enforcing, against the work's
+users, your or third parties' legal rights to forbid circumvention of
+technological measures.
+
+  4. Conveying Verbatim Copies.
+
+  You may convey verbatim copies of the Program's source code as you
+receive it, in any medium, provided that you conspicuously and
+appropriately publish on each copy an appropriate copyright notice;
+keep intact all notices stating that this License and any
+non-permissive terms added in accord with section 7 apply to the code;
+keep intact all notices of the absence of any warranty; and give all
+recipients a copy of this License along with the Program.
+
+  You may charge any price or no price for each copy that you convey,
+and you may offer support or warranty protection for a fee.
+
+  5. Conveying Modified Source Versions.
+
+  You may convey a work based on the Program, or the modifications to
+produce it from the Program, in the form of source code under the
+terms of section 4, provided that you also meet all of these conditions:
+
+    a) The work must carry prominent notices stating that you modified
+    it, and giving a relevant date.
+
+    b) The work must carry prominent notices stating that it is
+    released under this License and any conditions added under section
+    7.  This requirement modifies the requirement in section 4 to
+    "keep intact all notices".
+
+    c) You must license the entire work, as a whole, under this
+    License to anyone who comes into possession of a copy.  This
+    License will therefore apply, along with any applicable section 7
+    additional terms, to the whole of the work, and all its parts,
+    regardless of how they are packaged.  This License gives no
+    permission to license the work in any other way, but it does not
+    invalidate such permission if you have separately received it.
+
+    d) If the work has interactive user interfaces, each must display
+    Appropriate Legal Notices; however, if the Program has interactive
+    interfaces that do not display Appropriate Legal Notices, your
+    work need not make them do so.
+
+  A compilation of a covered work with other separate and independent
+works, which are not by their nature extensions of the covered work,
+and which are not combined with it such as to form a larger program,
+in or on a volume of a storage or distribution medium, is called an
+"aggregate" if the compilation and its resulting copyright are not
+used to limit the access or legal rights of the compilation's users
+beyond what the individual works permit.  Inclusion of a covered work
+in an aggregate does not cause this License to apply to the other
+parts of the aggregate.
+
+  6. Conveying Non-Source Forms.
+
+  You may convey a covered work in object code form under the terms
+of sections 4 and 5, provided that you also convey the
+machine-readable Corresponding Source under the terms of this License,
+in one of these ways:
+
+    a) Convey the object code in, or embodied in, a physical product
+    (including a physical distribution medium), accompanied by the
+    Corresponding Source fixed on a durable physical medium
+    customarily used for software interchange.
+
+    b) Convey the object code in, or embodied in, a physical product
+    (including a physical distribution medium), accompanied by a
+    written offer, valid for at least three years and valid for as
+    long as you offer spare parts or customer support for that product
+    model, to give anyone who possesses the object code either (1) a
+    copy of the Corresponding Source for all the software in the
+    product that is covered by this License, on a durable physical
+    medium customarily used for software interchange, for a price no
+    more than your reasonable cost of physically performing this
+    conveying of source, or (2) access to copy the
+    Corresponding Source from a network server at no charge.
+
+    c) Convey individual copies of the object code with a copy of the
+    written offer to provide the Corresponding Source.  This
+    alternative is allowed only occasionally and noncommercially, and
+    only if you received the object code with such an offer, in accord
+    with subsection 6b.
+
+    d) Convey the object code by offering access from a designated
+    place (gratis or for a charge), and offer equivalent access to the
+    Corresponding Source in the same way through the same place at no
+    further charge.  You need not require recipients to copy the
+    Corresponding Source along with the object code.  If the place to
+    copy the object code is a network server, the Corresponding Source
+    may be on a different server (operated by you or a third party)
+    that supports equivalent copying facilities, provided you maintain
+    clear directions next to the object code saying where to find the
+    Corresponding Source.  Regardless of what server hosts the
+    Corresponding Source, you remain obligated to ensure that it is
+    available for as long as needed to satisfy these requirements.
+
+    e) Convey the object code using peer-to-peer transmission, provided
+    you inform other peers where the object code and Corresponding
+    Source of the work are being offered to the general public at no
+    charge under subsection 6d.
+
+  A separable portion of the object code, whose source code is excluded
+from the Corresponding Source as a System Library, need not be
+included in conveying the object code work.
+
+  A "User Product" is either (1) a "consumer product", which means any
+tangible personal property which is normally used for personal, family,
+or household purposes, or (2) anything designed or sold for incorporation
+into a dwelling.  In determining whether a product is a consumer product,
+doubtful cases shall be resolved in favor of coverage.  For a particular
+product received by a particular user, "normally used" refers to a
+typical or common use of that class of product, regardless of the status
+of the particular user or of the way in which the particular user
+actually uses, or expects or is expected to use, the product.  A product
+is a consumer product regardless of whether the product has substantial
+commercial, industrial or non-consumer uses, unless such uses represent
+the only significant mode of use of the product.
+
+  "Installation Information" for a User Product means any methods,
+procedures, authorization keys, or other information required to install
+and execute modified versions of a covered work in that User Product from
+a modified version of its Corresponding Source.  The information must
+suffice to ensure that the continued functioning of the modified object
+code is in no case prevented or interfered with solely because
+modification has been made.
+
+  If you convey an object code work under this section in, or with, or
+specifically for use in, a User Product, and the conveying occurs as
+part of a transaction in which the right of possession and use of the
+User Product is transferred to the recipient in perpetuity or for a
+fixed term (regardless of how the transaction is characterized), the
+Corresponding Source conveyed under this section must be accompanied
+by the Installation Information.  But this requirement does not apply
+if neither you nor any third party retains the ability to install
+modified object code on the User Product (for example, the work has
+been installed in ROM).
+
+  The requirement to provide Installation Information does not include a
+requirement to continue to provide support service, warranty, or updates
+for a work that has been modified or installed by the recipient, or for
+the User Product in which it has been modified or installed.  Access to a
+network may be denied when the modification itself materially and
+adversely affects the operation of the network or violates the rules and
+protocols for communication across the network.
+
+  Corresponding Source conveyed, and Installation Information provided,
+in accord with this section must be in a format that is publicly
+documented (and with an implementation available to the public in
+source code form), and must require no special password or key for
+unpacking, reading or copying.
+
+  7. Additional Terms.
+
+  "Additional permissions" are terms that supplement the terms of this
+License by making exceptions from one or more of its conditions.
+Additional permissions that are applicable to the entire Program shall
+be treated as though they were included in this License, to the extent
+that they are valid under applicable law.  If additional permissions
+apply only to part of the Program, that part may be used separately
+under those permissions, but the entire Program remains governed by
+this License without regard to the additional permissions.
+
+  When you convey a copy of a covered work, you may at your option
+remove any additional permissions from that copy, or from any part of
+it.  (Additional permissions may be written to require their own
+removal in certain cases when you modify the work.)  You may place
+additional permissions on material, added by you to a covered work,
+for which you have or can give appropriate copyright permission.
+
+  Notwithstanding any other provision of this License, for material you
+add to a covered work, you may (if authorized by the copyright holders of
+that material) supplement the terms of this License with terms:
+
+    a) Disclaiming warranty or limiting liability differently from the
+    terms of sections 15 and 16 of this License; or
+
+    b) Requiring preservation of specified reasonable legal notices or
+    author attributions in that material or in the Appropriate Legal
+    Notices displayed by works containing it; or
+
+    c) Prohibiting misrepresentation of the origin of that material, or
+    requiring that modified versions of such material be marked in
+    reasonable ways as different from the original version; or
+
+    d) Limiting the use for publicity purposes of names of licensors or
+    authors of the material; or
+
+    e) Declining to grant rights under trademark law for use of some
+    trade names, trademarks, or service marks; or
+
+    f) Requiring indemnification of licensors and authors of that
+    material by anyone who conveys the material (or modified versions of
+    it) with contractual assumptions of liability to the recipient, for
+    any liability that these contractual assumptions directly impose on
+    those licensors and authors.
+
+  All other non-permissive additional terms are considered "further
+restrictions" within the meaning of section 10.  If the Program as you
+received it, or any part of it, contains a notice stating that it is
+governed by this License along with a term that is a further
+restriction, you may remove that term.  If a license document contains
+a further restriction but permits relicensing or conveying under this
+License, you may add to a covered work material governed by the terms
+of that license document, provided that the further restriction does
+not survive such relicensing or conveying.
+
+  If you add terms to a covered work in accord with this section, you
+must place, in the relevant source files, a statement of the
+additional terms that apply to those files, or a notice indicating
+where to find the applicable terms.
+
+  Additional terms, permissive or non-permissive, may be stated in the
+form of a separately written license, or stated as exceptions;
+the above requirements apply either way.
+
+  8. Termination.
+
+  You may not propagate or modify a covered work except as expressly
+provided under this License.  Any attempt otherwise to propagate or
+modify it is void, and will automatically terminate your rights under
+this License (including any patent licenses granted under the third
+paragraph of section 11).
+
+  However, if you cease all violation of this License, then your
+license from a particular copyright holder is reinstated (a)
+provisionally, unless and until the copyright holder explicitly and
+finally terminates your license, and (b) permanently, if the copyright
+holder fails to notify you of the violation by some reasonable means
+prior to 60 days after the cessation.
+
+  Moreover, your license from a particular copyright holder is
+reinstated permanently if the copyright holder notifies you of the
+violation by some reasonable means, this is the first time you have
+received notice of violation of this License (for any work) from that
+copyright holder, and you cure the violation prior to 30 days after
+your receipt of the notice.
+
+  Termination of your rights under this section does not terminate the
+licenses of parties who have received copies or rights from you under
+this License.  If your rights have been terminated and not permanently
+reinstated, you do not qualify to receive new licenses for the same
+material under section 10.
+
+  9. Acceptance Not Required for Having Copies.
+
+  You are not required to accept this License in order to receive or
+run a copy of the Program.  Ancillary propagation of a covered work
+occurring solely as a consequence of using peer-to-peer transmission
+to receive a copy likewise does not require acceptance.  However,
+nothing other than this License grants you permission to propagate or
+modify any covered work.  These actions infringe copyright if you do
+not accept this License.  Therefore, by modifying or propagating a
+covered work, you indicate your acceptance of this License to do so.
+
+  10. Automatic Licensing of Downstream Recipients.
+
+  Each time you convey a covered work, the recipient automatically
+receives a license from the original licensors, to run, modify and
+propagate that work, subject to this License.  You are not responsible
+for enforcing compliance by third parties with this License.
+
+  An "entity transaction" is a transaction transferring control of an
+organization, or substantially all assets of one, or subdividing an
+organization, or merging organizations.  If propagation of a covered
+work results from an entity transaction, each party to that
+transaction who receives a copy of the work also receives whatever
+licenses to the work the party's predecessor in interest had or could
+give under the previous paragraph, plus a right to possession of the
+Corresponding Source of the work from the predecessor in interest, if
+the predecessor has it or can get it with reasonable efforts.
+
+  You may not impose any further restrictions on the exercise of the
+rights granted or affirmed under this License.  For example, you may
+not impose a license fee, royalty, or other charge for exercise of
+rights granted under this License, and you may not initiate litigation
+(including a cross-claim or counterclaim in a lawsuit) alleging that
+any patent claim is infringed by making, using, selling, offering for
+sale, or importing the Program or any portion of it.
+
+  11. Patents.
+
+  A "contributor" is a copyright holder who authorizes use under this
+License of the Program or a work on which the Program is based.  The
+work thus licensed is called the contributor's "contributor version".
+
+  A contributor's "essential patent claims" are all patent claims
+owned or controlled by the contributor, whether already acquired or
+hereafter acquired, that would be infringed by some manner, permitted
+by this License, of making, using, or selling its contributor version,
+but do not include claims that would be infringed only as a
+consequence of further modification of the contributor version.  For
+purposes of this definition, "control" includes the right to grant
+patent sublicenses in a manner consistent with the requirements of
+this License.
+
+  Each contributor grants you a non-exclusive, worldwide, royalty-free
+patent license under the contributor's essential patent claims, to
+make, use, sell, offer for sale, import and otherwise run, modify and
+propagate the contents of its contributor version.
+
+  In the following three paragraphs, a "patent license" is any express
+agreement or commitment, however denominated, not to enforce a patent
+(such as an express permission to practice a patent or covenant not to
+sue for patent infringement).  To "grant" such a patent license to a
+party means to make such an agreement or commitment not to enforce a
+patent against the party.
+
+  If you convey a covered work, knowingly relying on a patent license,
+and the Corresponding Source of the work is not available for anyone
+to copy, free of charge and under the terms of this License, through a
+publicly available network server or other readily accessible means,
+then you must either (1) cause the Corresponding Source to be so
+available, or (2) arrange to deprive yourself of the benefit of the
+patent license for this particular work, or (3) arrange, in a manner
+consistent with the requirements of this License, to extend the patent
+license to downstream recipients.  "Knowingly relying" means you have
+actual knowledge that, but for the patent license, your conveying the
+covered work in a country, or your recipient's use of the covered work
+in a country, would infringe one or more identifiable patents in that
+country that you have reason to believe are valid.
+
+  If, pursuant to or in connection with a single transaction or
+arrangement, you convey, or propagate by procuring conveyance of, a
+covered work, and grant a patent license to some of the parties
+receiving the covered work authorizing them to use, propagate, modify
+or convey a specific copy of the covered work, then the patent license
+you grant is automatically extended to all recipients of the covered
+work and works based on it.
+
+  A patent license is "discriminatory" if it does not include within
+the scope of its coverage, prohibits the exercise of, or is
+conditioned on the non-exercise of one or more of the rights that are
+specifically granted under this License.  You may not convey a covered
+work if you are a party to an arrangement with a third party that is
+in the business of distributing software, under which you make payment
+to the third party based on the extent of your activity of conveying
+the work, and under which the third party grants, to any of the
+parties who would receive the covered work from you, a discriminatory
+patent license (a) in connection with copies of the covered work
+conveyed by you (or copies made from those copies), or (b) primarily
+for and in connection with specific products or compilations that
+contain the covered work, unless you entered into that arrangement,
+or that patent license was granted, prior to 28 March 2007.
+
+  Nothing in this License shall be construed as excluding or limiting
+any implied license or other defenses to infringement that may
+otherwise be available to you under applicable patent law.
+
+  12. No Surrender of Others' Freedom.
+
+  If conditions are imposed on you (whether by court order, agreement or
+otherwise) that contradict the conditions of this License, they do not
+excuse you from the conditions of this License.  If you cannot convey a
+covered work so as to satisfy simultaneously your obligations under this
+License and any other pertinent obligations, then as a consequence you may
+not convey it at all.  For example, if you agree to terms that obligate you
+to collect a royalty for further conveying from those to whom you convey
+the Program, the only way you could satisfy both those terms and this
+License would be to refrain entirely from conveying the Program.
+
+  13. Use with the GNU Affero General Public License.
+
+  Notwithstanding any other provision of this License, you have
+permission to link or combine any covered work with a work licensed
+under version 3 of the GNU Affero General Public License into a single
+combined work, and to convey the resulting work.  The terms of this
+License will continue to apply to the part which is the covered work,
+but the special requirements of the GNU Affero General Public License,
+section 13, concerning interaction through a network will apply to the
+combination as such.
+
+  14. Revised Versions of this License.
+
+  The Free Software Foundation may publish revised and/or new versions of
+the GNU General Public License from time to time.  Such new versions will
+be similar in spirit to the present version, but may differ in detail to
+address new problems or concerns.
+
+  Each version is given a distinguishing version number.  If the
+Program specifies that a certain numbered version of the GNU General
+Public License "or any later version" applies to it, you have the
+option of following the terms and conditions either of that numbered
+version or of any later version published by the Free Software
+Foundation.  If the Program does not specify a version number of the
+GNU General Public License, you may choose any version ever published
+by the Free Software Foundation.
+
+  If the Program specifies that a proxy can decide which future
+versions of the GNU General Public License can be used, that proxy's
+public statement of acceptance of a version permanently authorizes you
+to choose that version for the Program.
+
+  Later license versions may give you additional or different
+permissions.  However, no additional obligations are imposed on any
+author or copyright holder as a result of your choosing to follow a
+later version.
+
+  15. Disclaimer of Warranty.
+
+  THERE IS NO WARRANTY FOR THE PROGRAM, TO THE EXTENT PERMITTED BY
+APPLICABLE LAW.  EXCEPT WHEN OTHERWISE STATED IN WRITING THE COPYRIGHT
+HOLDERS AND/OR OTHER PARTIES PROVIDE THE PROGRAM "AS IS" WITHOUT WARRANTY
+OF ANY KIND, EITHER EXPRESSED OR IMPLIED, INCLUDING, BUT NOT LIMITED TO,
+THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
+PURPOSE.  THE ENTIRE RISK AS TO THE QUALITY AND PERFORMANCE OF THE PROGRAM
+IS WITH YOU.  SHOULD THE PROGRAM PROVE DEFECTIVE, YOU ASSUME THE COST OF
+ALL NECESSARY SERVICING, REPAIR OR CORRECTION.
+
+  16. Limitation of Liability.
+
+  IN NO EVENT UNLESS REQUIRED BY APPLICABLE LAW OR AGREED TO IN WRITING
+WILL ANY COPYRIGHT HOLDER, OR ANY OTHER PARTY WHO MODIFIES AND/OR CONVEYS
+THE PROGRAM AS PERMITTED ABOVE, BE LIABLE TO YOU FOR DAMAGES, INCLUDING ANY
+GENERAL, SPECIAL, INCIDENTAL OR CONSEQUENTIAL DAMAGES ARISING OUT OF THE
+USE OR INABILITY TO USE THE PROGRAM (INCLUDING BUT NOT LIMITED TO LOSS OF
+DATA OR DATA BEING RENDERED INACCURATE OR LOSSES SUSTAINED BY YOU OR THIRD
+PARTIES OR A FAILURE OF THE PROGRAM TO OPERATE WITH ANY OTHER PROGRAMS),
+EVEN IF SUCH HOLDER OR OTHER PARTY HAS BEEN ADVISED OF THE POSSIBILITY OF
+SUCH DAMAGES.
+
+  17. Interpretation of Sections 15 and 16.
+
+  If the disclaimer of warranty and limitation of liability provided
+above cannot be given local legal effect according to their terms,
+reviewing courts shall apply local law that most closely approximates
+an absolute waiver of all civil liability in connection with the
+Program, unless a warranty or assumption of liability accompanies a
+copy of the Program in return for a fee.
+
+                     END OF TERMS AND CONDITIONS
+
+            How to Apply These Terms to Your New Programs
+
+  If you develop a new program, and you want it to be of the greatest
+possible use to the public, the best way to achieve this is to make it
+free software which everyone can redistribute and change under these terms.
+
+  To do so, attach the following notices to the program.  It is safest
+to attach them to the start of each source file to most effectively
+state the exclusion of warranty; and each file should have at least
+the "copyright" line and a pointer to where the full notice is found.
+
+    <one line to give the program's name and a brief idea of what it does.>
+    Copyright (C) <year>  <name of author>
+
+    This program is free software: you can redistribute it and/or modify
+    it under the terms of the GNU General Public License as published by
+    the Free Software Foundation, either version 3 of the License, or
+    (at your option) any later version.
+
+    This program is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+    GNU General Public License for more details.
+
+    You should have received a copy of the GNU General Public License
+    along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+Also add information on how to contact you by electronic and paper mail.
+
+  If the program does terminal interaction, make it output a short
+notice like this when it starts in an interactive mode:
+
+    <program>  Copyright (C) <year>  <name of author>
+    This program comes with ABSOLUTELY NO WARRANTY; for details type `show w'.
+    This is free software, and you are welcome to redistribute it
+    under certain conditions; type `show c' for details.
+
+The hypothetical commands `show w' and `show c' should show the appropriate
+parts of the General Public License.  Of course, your program's commands
+might be different; for a GUI interface, you would use an "about box".
+
+  You should also get your employer (if you work as a programmer) or school,
+if any, to sign a "copyright disclaimer" for the program, if necessary.
+For more information on this, and how to apply and follow the GNU GPL, see
+<http://www.gnu.org/licenses/>.
+
+  The GNU General Public License does not permit incorporating your program
+into proprietary programs.  If your program is a subroutine library, you
+may consider it more useful to permit linking proprietary applications with
+the library.  If this is what you want to do, use the GNU Lesser General
+Public License instead of this License.  But first, please read
+<http://www.gnu.org/philosophy/why-not-lgpl.html>.
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/ChangeLog
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/ChangeLog
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/INSTALL
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/INSTALL
@ -0,0 +1,237 @@
+Installation Instructions
+*************************
+
+Copyright (C) 1994, 1995, 1996, 1999, 2000, 2001, 2002, 2004, 2005,
+2006, 2007 Free Software Foundation, Inc.
+
+This file is free documentation; the Free Software Foundation gives
+unlimited permission to copy, distribute and modify it.
+
+Basic Installation
+==================
+
+Briefly, the shell commands `./configure; make; make install' should
+configure, build, and install this package.  The following
+more-detailed instructions are generic; see the `README' file for
+instructions specific to this package.
+
+   The `configure' shell script attempts to guess correct values for
+various system-dependent variables used during compilation.  It uses
+those values to create a `Makefile' in each directory of the package.
+It may also create one or more `.h' files containing system-dependent
+definitions.  Finally, it creates a shell script `config.status' that
+you can run in the future to recreate the current configuration, and a
+file `config.log' containing compiler output (useful mainly for
+debugging `configure').
+
+   It can also use an optional file (typically called `config.cache'
+and enabled with `--cache-file=config.cache' or simply `-C') that saves
+the results of its tests to speed up reconfiguring.  Caching is
+disabled by default to prevent problems with accidental use of stale
+cache files.
+
+   If you need to do unusual things to compile the package, please try
+to figure out how `configure' could check whether to do them, and mail
+diffs or instructions to the address given in the `README' so they can
+be considered for the next release.  If you are using the cache, and at
+some point `config.cache' contains results you don't want to keep, you
+may remove or edit it.
+
+   The file `configure.ac' (or `configure.in') is used to create
+`configure' by a program called `autoconf'.  You need `configure.ac' if
+you want to change it or regenerate `configure' using a newer version
+of `autoconf'.
+
+The simplest way to compile this package is:
+
+  1. `cd' to the directory containing the package's source code and type
+     `./configure' to configure the package for your system.
+
+     Running `configure' might take a while.  While running, it prints
+     some messages telling which features it is checking for.
+
+  2. Type `make' to compile the package.
+
+  3. Optionally, type `make check' to run any self-tests that come with
+     the package.
+
+  4. Type `make install' to install the programs and any data files and
+     documentation.
+
+  5. You can remove the program binaries and object files from the
+     source code directory by typing `make clean'.  To also remove the
+     files that `configure' created (so you can compile the package for
+     a different kind of computer), type `make distclean'.  There is
+     also a `make maintainer-clean' target, but that is intended mainly
+     for the package's developers.  If you use it, you may have to get
+     all sorts of other programs in order to regenerate files that came
+     with the distribution.
+
+  6. Often, you can also type `make uninstall' to remove the installed
+     files again.
+
+Compilers and Options
+=====================
+
+Some systems require unusual options for compilation or linking that the
+`configure' script does not know about.  Run `./configure --help' for
+details on some of the pertinent environment variables.
+
+   You can give `configure' initial values for configuration parameters
+by setting variables in the command line or in the environment.  Here
+is an example:
+
+     ./configure CC=c99 CFLAGS=-g LIBS=-lposix
+
+   *Note Defining Variables::, for more details.
+
+Compiling For Multiple Architectures
+====================================
+
+You can compile the package for more than one kind of computer at the
+same time, by placing the object files for each architecture in their
+own directory.  To do this, you can use GNU `make'.  `cd' to the
+directory where you want the object files and executables to go and run
+the `configure' script.  `configure' automatically checks for the
+source code in the directory that `configure' is in and in `..'.
+
+   With a non-GNU `make', it is safer to compile the package for one
+architecture at a time in the source code directory.  After you have
+installed the package for one architecture, use `make distclean' before
+reconfiguring for another architecture.
+
+Installation Names
+==================
+
+By default, `make install' installs the package's commands under
+`/usr/local/bin', include files under `/usr/local/include', etc.  You
+can specify an installation prefix other than `/usr/local' by giving
+`configure' the option `--prefix=PREFIX'.
+
+   You can specify separate installation prefixes for
+architecture-specific files and architecture-independent files.  If you
+pass the option `--exec-prefix=PREFIX' to `configure', the package uses
+PREFIX as the prefix for installing programs and libraries.
+Documentation and other data files still use the regular prefix.
+
+   In addition, if you use an unusual directory layout you can give
+options like `--bindir=DIR' to specify different values for particular
+kinds of files.  Run `configure --help' for a list of the directories
+you can set and what kinds of files go in them.
+
+   If the package supports it, you can cause programs to be installed
+with an extra prefix or suffix on their names by giving `configure' the
+option `--program-prefix=PREFIX' or `--program-suffix=SUFFIX'.
+
+Optional Features
+=================
+
+Some packages pay attention to `--enable-FEATURE' options to
+`configure', where FEATURE indicates an optional part of the package.
+They may also pay attention to `--with-PACKAGE' options, where PACKAGE
+is something like `gnu-as' or `x' (for the X Window System).  The
+`README' should mention any `--enable-' and `--with-' options that the
+package recognizes.
+
+   For packages that use the X Window System, `configure' can usually
+find the X include and library files automatically, but if it doesn't,
+you can use the `configure' options `--x-includes=DIR' and
+`--x-libraries=DIR' to specify their locations.
+
+Specifying the System Type
+==========================
+
+There may be some features `configure' cannot figure out automatically,
+but needs to determine by the type of machine the package will run on.
+Usually, assuming the package is built to be run on the _same_
+architectures, `configure' can figure that out, but if it prints a
+message saying it cannot guess the machine type, give it the
+`--build=TYPE' option.  TYPE can either be a short name for the system
+type, such as `sun4', or a canonical name which has the form:
+
+     CPU-COMPANY-SYSTEM
+
+where SYSTEM can have one of these forms:
+
+     OS KERNEL-OS
+
+   See the file `config.sub' for the possible values of each field.  If
+`config.sub' isn't included in this package, then this package doesn't
+need to know the machine type.
+
+   If you are _building_ compiler tools for cross-compiling, you should
+use the option `--target=TYPE' to select the type of system they will
+produce code for.
+
+   If you want to _use_ a cross compiler, that generates code for a
+platform different from the build platform, you should specify the
+"host" platform (i.e., that on which the generated programs will
+eventually be run) with `--host=TYPE'.
+
+Sharing Defaults
+================
+
+If you want to set default values for `configure' scripts to share, you
+can create a site shell script called `config.site' that gives default
+values for variables like `CC', `cache_file', and `prefix'.
+`configure' looks for `PREFIX/share/config.site' if it exists, then
+`PREFIX/etc/config.site' if it exists.  Or, you can set the
+`CONFIG_SITE' environment variable to the location of the site script.
+A warning: not all `configure' scripts look for a site script.
+
+Defining Variables
+==================
+
+Variables not defined in a site shell script can be set in the
+environment passed to `configure'.  However, some packages may run
+configure again during the build, and the customized values of these
+variables may be lost.  In order to avoid this problem, you should set
+them in the `configure' command line, using `VAR=value'.  For example:
+
+     ./configure CC=/usr/local2/bin/gcc
+
+causes the specified `gcc' to be used as the C compiler (unless it is
+overridden in the site shell script).
+
+Unfortunately, this technique does not work for `CONFIG_SHELL' due to
+an Autoconf bug.  Until the bug is fixed you can use this workaround:
+
+     CONFIG_SHELL=/bin/bash /bin/bash ./configure CONFIG_SHELL=/bin/bash
+
+`configure' Invocation
+======================
+
+`configure' recognizes the following options to control how it operates.
+
+`--help'
+`-h'
+     Print a summary of the options to `configure', and exit.
+
+`--version'
+`-V'
+     Print the version of Autoconf used to generate the `configure'
+     script, and exit.
+
+`--cache-file=FILE'
+     Enable the cache: use and save the results of the tests in FILE,
+     traditionally `config.cache'.  FILE defaults to `/dev/null' to
+     disable caching.
+
+`--config-cache'
+`-C'
+     Alias for `--cache-file=config.cache'.
+
+`--quiet'
+`--silent'
+`-q'
+     Do not print messages saying which checks are being made.  To
+     suppress all normal output, redirect it to `/dev/null' (any error
+     messages will still be shown).
+
+`--srcdir=DIR'
+     Look for the package's source code in directory DIR.  Usually
+     `configure' can determine that directory automatically.
+
+`configure' also accepts some other, not widely useful, options.  Run
+`configure --help' for more details.
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/Makefile.am
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/Makefile.am
@ -0,0 +1,29 @@
+## Process this file with automake to produce Makefile.in
+## Created by Anjuta
+
+## Sub-directories that the recursive targets descend into.
+SUBDIRS = src 
+
+## Documentation files and the directory they are installed into.
+mgizadocdir = ${prefix}/doc/mgiza
+mgizadoc_DATA = \
+	README\
+	COPYING\
+	AUTHORS\
+	ChangeLog\
+	INSTALL\
+	NEWS
+
+## Directory the helper scripts are installed into.
+mgizascriptsdir = ${prefix}/scripts/
+
+## NOTE(review): `scripts/*' is a wildcard that is passed through to the
+## generated Makefile unchanged and only expanded later by make/the shell;
+## confirm that it picks up exactly the files that should be installed.
+mgizascripts_SCRIPTS = \
+				   scripts/*
+
+## Ship the documentation files and the scripts in the distribution.
+EXTRA_DIST = $(mgizadoc_DATA) \
+	         ${mgizascripts_SCRIPTS}
+# Copy all the spec files into the distribution directory. Of course,
+# only one is actually used.
+# NOTE(review): `*.spec' is matched in the directory make runs in; for
+# builds outside the source tree, confirm whether $(srcdir)/*.spec is meant.
+dist-hook:
+	for specfile in *.spec; do \
+		if test -f $$specfile; then \
+			cp -p $$specfile $(distdir); \
+		fi \
+	done
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/Makefile.in
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/Makefile.in
@ -0,0 +1,683 @@
+# Makefile.in generated by automake 1.10.1 from Makefile.am.
+# @configure_input@
+
+# Copyright (C) 1994, 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002,
+# 2003, 2004, 2005, 2006, 2007, 2008  Free Software Foundation, Inc.
+# This Makefile.in is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY, to the extent permitted by law; without
+# even the implied warranty of MERCHANTABILITY or FITNESS FOR A
+# PARTICULAR PURPOSE.
+
+@SET_MAKE@
+
+
+VPATH = @srcdir@
+pkgdatadir = $(datadir)/@PACKAGE@
+pkglibdir = $(libdir)/@PACKAGE@
+pkgincludedir = $(includedir)/@PACKAGE@
+am__cd = CDPATH="$${ZSH_VERSION+.}$(PATH_SEPARATOR)" && cd
+install_sh_DATA = $(install_sh) -c -m 644
+install_sh_PROGRAM = $(install_sh) -c
+install_sh_SCRIPT = $(install_sh) -c
+INSTALL_HEADER = $(INSTALL_DATA)
+transform = $(program_transform_name)
+NORMAL_INSTALL = :
+PRE_INSTALL = :
+POST_INSTALL = :
+NORMAL_UNINSTALL = :
+PRE_UNINSTALL = :
+POST_UNINSTALL = :
+subdir = .
+DIST_COMMON = README $(am__configure_deps) $(srcdir)/Makefile.am \
+	$(srcdir)/Makefile.in $(srcdir)/config.h.in \
+	$(top_srcdir)/configure AUTHORS COPYING ChangeLog INSTALL NEWS \
+	config.guess config.sub depcomp install-sh ltmain.sh missing
+ACLOCAL_M4 = $(top_srcdir)/aclocal.m4
+am__aclocal_m4_deps = $(top_srcdir)/configure.ac
+am__configure_deps = $(am__aclocal_m4_deps) $(CONFIGURE_DEPENDENCIES) \
+	$(ACLOCAL_M4)
+am__CONFIG_DISTCLEAN_FILES = config.status config.cache config.log \
+ configure.lineno config.status.lineno
+mkinstalldirs = $(install_sh) -d
+CONFIG_HEADER = config.h
+CONFIG_CLEAN_FILES =
+am__installdirs = "$(DESTDIR)$(mgizascriptsdir)" \
+	"$(DESTDIR)$(mgizadocdir)"
+mgizascriptsSCRIPT_INSTALL = $(INSTALL_SCRIPT)
+SCRIPTS = $(mgizascripts_SCRIPTS)
+SOURCES =
+DIST_SOURCES =
+RECURSIVE_TARGETS = all-recursive check-recursive dvi-recursive \
+	html-recursive info-recursive install-data-recursive \
+	install-dvi-recursive install-exec-recursive \
+	install-html-recursive install-info-recursive \
+	install-pdf-recursive install-ps-recursive install-recursive \
+	installcheck-recursive installdirs-recursive pdf-recursive \
+	ps-recursive uninstall-recursive
+am__vpath_adj_setup = srcdirstrip=`echo "$(srcdir)" | sed 's|.|.|g'`;
+am__vpath_adj = case $$p in \
+    $(srcdir)/*) f=`echo "$$p" | sed "s|^$$srcdirstrip/||"`;; \
+    *) f=$$p;; \
+  esac;
+am__strip_dir = `echo $$p | sed -e 's|^.*/||'`;
+mgizadocDATA_INSTALL = $(INSTALL_DATA)
+DATA = $(mgizadoc_DATA)
+RECURSIVE_CLEAN_TARGETS = mostlyclean-recursive clean-recursive	\
+  distclean-recursive maintainer-clean-recursive
+ETAGS = etags
+CTAGS = ctags
+DIST_SUBDIRS = $(SUBDIRS)
+DISTFILES = $(DIST_COMMON) $(DIST_SOURCES) $(TEXINFOS) $(EXTRA_DIST)
+distdir = $(PACKAGE)-$(VERSION)
+top_distdir = $(distdir)
+am__remove_distdir = \
+  { test ! -d $(distdir) \
+    || { find $(distdir) -type d ! -perm -200 -exec chmod u+w {} ';' \
+         && rm -fr $(distdir); }; }
+DIST_ARCHIVES = $(distdir).tar.gz
+GZIP_ENV = --best
+distuninstallcheck_listfiles = find . -type f -print
+distcleancheck_listfiles = find . -type f -print
+ACLOCAL = @ACLOCAL@
+AMTAR = @AMTAR@
+AUTOCONF = @AUTOCONF@
+AUTOHEADER = @AUTOHEADER@
+AUTOMAKE = @AUTOMAKE@
+AWK = @AWK@
+CC = @CC@
+CCDEPMODE = @CCDEPMODE@
+CFLAGS = @CFLAGS@
+CPP = @CPP@
+CPPFLAGS = @CPPFLAGS@
+CXX = @CXX@
+CXXDEPMODE = @CXXDEPMODE@
+CXXFLAGS = @CXXFLAGS@
+CYGPATH_W = @CYGPATH_W@
+DEFS = @DEFS@
+DEPDIR = @DEPDIR@
+ECHO_C = @ECHO_C@
+ECHO_N = @ECHO_N@
+ECHO_T = @ECHO_T@
+EGREP = @EGREP@
+EXEEXT = @EXEEXT@
+GREP = @GREP@
+INSTALL = @INSTALL@
+INSTALL_DATA = @INSTALL_DATA@
+INSTALL_PROGRAM = @INSTALL_PROGRAM@
+INSTALL_SCRIPT = @INSTALL_SCRIPT@
+INSTALL_STRIP_PROGRAM = @INSTALL_STRIP_PROGRAM@
+LDFLAGS = @LDFLAGS@
+LIBOBJS = @LIBOBJS@
+LIBS = @LIBS@
+LTLIBOBJS = @LTLIBOBJS@
+MAINT = @MAINT@
+MAKEINFO = @MAKEINFO@
+MKDIR_P = @MKDIR_P@
+OBJEXT = @OBJEXT@
+PACKAGE = @PACKAGE@
+PACKAGE_BUGREPORT = @PACKAGE_BUGREPORT@
+PACKAGE_NAME = @PACKAGE_NAME@
+PACKAGE_STRING = @PACKAGE_STRING@
+PACKAGE_TARNAME = @PACKAGE_TARNAME@
+PACKAGE_VERSION = @PACKAGE_VERSION@
+PATH_SEPARATOR = @PATH_SEPARATOR@
+RANLIB = @RANLIB@
+SET_MAKE = @SET_MAKE@
+SHELL = @SHELL@
+STRIP = @STRIP@
+VERSION = @VERSION@
+abs_builddir = @abs_builddir@
+abs_srcdir = @abs_srcdir@
+abs_top_builddir = @abs_top_builddir@
+abs_top_srcdir = @abs_top_srcdir@
+ac_ct_CC = @ac_ct_CC@
+ac_ct_CXX = @ac_ct_CXX@
+am__include = @am__include@
+am__leading_dot = @am__leading_dot@
+am__quote = @am__quote@
+am__tar = @am__tar@
+am__untar = @am__untar@
+bindir = @bindir@
+build_alias = @build_alias@
+builddir = @builddir@
+datadir = @datadir@
+datarootdir = @datarootdir@
+docdir = @docdir@
+dvidir = @dvidir@
+exec_prefix = @exec_prefix@
+host_alias = @host_alias@
+htmldir = @htmldir@
+includedir = @includedir@
+infodir = @infodir@
+install_sh = @install_sh@
+libdir = @libdir@
+libexecdir = @libexecdir@
+localedir = @localedir@
+localstatedir = @localstatedir@
+mandir = @mandir@
+mkdir_p = @mkdir_p@
+oldincludedir = @oldincludedir@
+pdfdir = @pdfdir@
+prefix = @prefix@
+program_transform_name = @program_transform_name@
+psdir = @psdir@
+sbindir = @sbindir@
+sharedstatedir = @sharedstatedir@
+srcdir = @srcdir@
+sysconfdir = @sysconfdir@
+target_alias = @target_alias@
+top_build_prefix = @top_build_prefix@
+top_builddir = @top_builddir@
+top_srcdir = @top_srcdir@
+SUBDIRS = src 
+mgizadocdir = ${prefix}/doc/mgiza
+mgizadoc_DATA = \
+	README\
+	COPYING\
+	AUTHORS\
+	ChangeLog\
+	INSTALL\
+	NEWS
+
+mgizascriptsdir = ${prefix}/scripts/
+mgizascripts_SCRIPTS = \
+				   scripts/*
+
+EXTRA_DIST = $(mgizadoc_DATA) \
+	         ${mgizascripts_SCRIPTS}
+
+all: config.h
+	$(MAKE) $(AM_MAKEFLAGS) all-recursive
+
+.SUFFIXES:
+am--refresh:
+	@:
+$(srcdir)/Makefile.in: @MAINTAINER_MODE_TRUE@ $(srcdir)/Makefile.am  $(am__configure_deps)
+	@for dep in $?; do \
+	  case '$(am__configure_deps)' in \
+	    *$$dep*) \
+	      echo ' cd $(srcdir) && $(AUTOMAKE) --gnu '; \
+	      cd $(srcdir) && $(AUTOMAKE) --gnu  \
+		&& exit 0; \
+	      exit 1;; \
+	  esac; \
+	done; \
+	echo ' cd $(top_srcdir) && $(AUTOMAKE) --gnu  Makefile'; \
+	cd $(top_srcdir) && \
+	  $(AUTOMAKE) --gnu  Makefile
+.PRECIOUS: Makefile
+Makefile: $(srcdir)/Makefile.in $(top_builddir)/config.status
+	@case '$?' in \
+	  *config.status*) \
+	    echo ' $(SHELL) ./config.status'; \
+	    $(SHELL) ./config.status;; \
+	  *) \
+	    echo ' cd $(top_builddir) && $(SHELL) ./config.status $@ $(am__depfiles_maybe)'; \
+	    cd $(top_builddir) && $(SHELL) ./config.status $@ $(am__depfiles_maybe);; \
+	esac;
+
+$(top_builddir)/config.status: $(top_srcdir)/configure $(CONFIG_STATUS_DEPENDENCIES)
+	$(SHELL) ./config.status --recheck
+
+$(top_srcdir)/configure: @MAINTAINER_MODE_TRUE@ $(am__configure_deps)
+	cd $(srcdir) && $(AUTOCONF)
+$(ACLOCAL_M4): @MAINTAINER_MODE_TRUE@ $(am__aclocal_m4_deps)
+	cd $(srcdir) && $(ACLOCAL) $(ACLOCAL_AMFLAGS)
+
+config.h: stamp-h1
+	@if test ! -f $@; then \
+	  rm -f stamp-h1; \
+	  $(MAKE) $(AM_MAKEFLAGS) stamp-h1; \
+	else :; fi
+
+stamp-h1: $(srcdir)/config.h.in $(top_builddir)/config.status
+	@rm -f stamp-h1
+	cd $(top_builddir) && $(SHELL) ./config.status config.h
+$(srcdir)/config.h.in: @MAINTAINER_MODE_TRUE@ $(am__configure_deps) 
+	cd $(top_srcdir) && $(AUTOHEADER)
+	rm -f stamp-h1
+	touch $@
+
+distclean-hdr:
+	-rm -f config.h stamp-h1
+install-mgizascriptsSCRIPTS: $(mgizascripts_SCRIPTS)
+	@$(NORMAL_INSTALL)
+	test -z "$(mgizascriptsdir)" || $(MKDIR_P) "$(DESTDIR)$(mgizascriptsdir)"
+	@list='$(mgizascripts_SCRIPTS)'; for p in $$list; do \
+	  if test -f "$$p"; then d=; else d="$(srcdir)/"; fi; \
+	  if test -f $$d$$p; then \
+	    f=`echo "$$p" | sed 's|^.*/||;$(transform)'`; \
+	    echo " $(mgizascriptsSCRIPT_INSTALL) '$$d$$p' '$(DESTDIR)$(mgizascriptsdir)/$$f'"; \
+	    $(mgizascriptsSCRIPT_INSTALL) "$$d$$p" "$(DESTDIR)$(mgizascriptsdir)/$$f"; \
+	  else :; fi; \
+	done
+
+uninstall-mgizascriptsSCRIPTS:
+	@$(NORMAL_UNINSTALL)
+	@list='$(mgizascripts_SCRIPTS)'; for p in $$list; do \
+	  f=`echo "$$p" | sed 's|^.*/||;$(transform)'`; \
+	  echo " rm -f '$(DESTDIR)$(mgizascriptsdir)/$$f'"; \
+	  rm -f "$(DESTDIR)$(mgizascriptsdir)/$$f"; \
+	done
+install-mgizadocDATA: $(mgizadoc_DATA)
+	@$(NORMAL_INSTALL)
+	test -z "$(mgizadocdir)" || $(MKDIR_P) "$(DESTDIR)$(mgizadocdir)"
+	@list='$(mgizadoc_DATA)'; for p in $$list; do \
+	  if test -f "$$p"; then d=; else d="$(srcdir)/"; fi; \
+	  f=$(am__strip_dir) \
+	  echo " $(mgizadocDATA_INSTALL) '$$d$$p' '$(DESTDIR)$(mgizadocdir)/$$f'"; \
+	  $(mgizadocDATA_INSTALL) "$$d$$p" "$(DESTDIR)$(mgizadocdir)/$$f"; \
+	done
+
+uninstall-mgizadocDATA:
+	@$(NORMAL_UNINSTALL)
+	@list='$(mgizadoc_DATA)'; for p in $$list; do \
+	  f=$(am__strip_dir) \
+	  echo " rm -f '$(DESTDIR)$(mgizadocdir)/$$f'"; \
+	  rm -f "$(DESTDIR)$(mgizadocdir)/$$f"; \
+	done
+
+# This directory's subdirectories are mostly independent; you can cd
+# into them and run `make' without going through this Makefile.
+# To change the values of `make' variables: instead of editing Makefiles,
+# (1) if the variable is set in `config.status', edit `config.status'
+#     (which will cause the Makefiles to be regenerated when you run `make');
+# (2) otherwise, pass the desired values on the `make' command line.
+$(RECURSIVE_TARGETS):
+	@failcom='exit 1'; \
+	for f in x $$MAKEFLAGS; do \
+	  case $$f in \
+	    *=* | --[!k]*);; \
+	    *k*) failcom='fail=yes';; \
+	  esac; \
+	done; \
+	dot_seen=no; \
+	target=`echo $@ | sed s/-recursive//`; \
+	list='$(SUBDIRS)'; for subdir in $$list; do \
+	  echo "Making $$target in $$subdir"; \
+	  if test "$$subdir" = "."; then \
+	    dot_seen=yes; \
+	    local_target="$$target-am"; \
+	  else \
+	    local_target="$$target"; \
+	  fi; \
+	  (cd $$subdir && $(MAKE) $(AM_MAKEFLAGS) $$local_target) \
+	  || eval $$failcom; \
+	done; \
+	if test "$$dot_seen" = "no"; then \
+	  $(MAKE) $(AM_MAKEFLAGS) "$$target-am" || exit 1; \
+	fi; test -z "$$fail"
+
+$(RECURSIVE_CLEAN_TARGETS):
+	@failcom='exit 1'; \
+	for f in x $$MAKEFLAGS; do \
+	  case $$f in \
+	    *=* | --[!k]*);; \
+	    *k*) failcom='fail=yes';; \
+	  esac; \
+	done; \
+	dot_seen=no; \
+	case "$@" in \
+	  distclean-* | maintainer-clean-*) list='$(DIST_SUBDIRS)' ;; \
+	  *) list='$(SUBDIRS)' ;; \
+	esac; \
+	rev=''; for subdir in $$list; do \
+	  if test "$$subdir" = "."; then :; else \
+	    rev="$$subdir $$rev"; \
+	  fi; \
+	done; \
+	rev="$$rev ."; \
+	target=`echo $@ | sed s/-recursive//`; \
+	for subdir in $$rev; do \
+	  echo "Making $$target in $$subdir"; \
+	  if test "$$subdir" = "."; then \
+	    local_target="$$target-am"; \
+	  else \
+	    local_target="$$target"; \
+	  fi; \
+	  (cd $$subdir && $(MAKE) $(AM_MAKEFLAGS) $$local_target) \
+	  || eval $$failcom; \
+	done && test -z "$$fail"
+tags-recursive:
+	list='$(SUBDIRS)'; for subdir in $$list; do \
+	  test "$$subdir" = . || (cd $$subdir && $(MAKE) $(AM_MAKEFLAGS) tags); \
+	done
+ctags-recursive:
+	list='$(SUBDIRS)'; for subdir in $$list; do \
+	  test "$$subdir" = . || (cd $$subdir && $(MAKE) $(AM_MAKEFLAGS) ctags); \
+	done
+
+# Build an `ID' database with mkid from the de-duplicated list of
+# $(SOURCES), $(HEADERS), $(LISP) and $(TAGS_FILES).  A name that is not a
+# regular file relative to the current directory is prefixed with $(srcdir)/.
+# The awk filter records each name once and sets `nonempty' as soon as any
+# name is read, so the END block prints the unique names.  (The flag was
+# previously misspelled `nonemtpy', which left `nonempty' unset and made
+# $$unique always empty.)  This is the same filter the TAGS and CTAGS
+# rules use.
+ID: $(HEADERS) $(SOURCES) $(LISP) $(TAGS_FILES)
+	list='$(SOURCES) $(HEADERS) $(LISP) $(TAGS_FILES)'; \
+	unique=`for i in $$list; do \
+	    if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
+	  done | \
+	  $(AWK) '{ files[$$0] = 1; nonempty = 1; } \
+	      END { if (nonempty) { for (i in files) print i; }; }'`; \
+	mkid -fID $$unique
+tags: TAGS
+
+TAGS: tags-recursive $(HEADERS) $(SOURCES) config.h.in $(TAGS_DEPENDENCIES) \
+		$(TAGS_FILES) $(LISP)
+	tags=; \
+	here=`pwd`; \
+	if ($(ETAGS) --etags-include --version) >/dev/null 2>&1; then \
+	  include_option=--etags-include; \
+	  empty_fix=.; \
+	else \
+	  include_option=--include; \
+	  empty_fix=; \
+	fi; \
+	list='$(SUBDIRS)'; for subdir in $$list; do \
+	  if test "$$subdir" = .; then :; else \
+	    test ! -f $$subdir/TAGS || \
+	      tags="$$tags $$include_option=$$here/$$subdir/TAGS"; \
+	  fi; \
+	done; \
+	list='$(SOURCES) $(HEADERS) config.h.in $(LISP) $(TAGS_FILES)'; \
+	unique=`for i in $$list; do \
+	    if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
+	  done | \
+	  $(AWK) '{ files[$$0] = 1; nonempty = 1; } \
+	      END { if (nonempty) { for (i in files) print i; }; }'`; \
+	if test -z "$(ETAGS_ARGS)$$tags$$unique"; then :; else \
+	  test -n "$$unique" || unique=$$empty_fix; \
+	  $(ETAGS) $(ETAGSFLAGS) $(AM_ETAGSFLAGS) $(ETAGS_ARGS) \
+	    $$tags $$unique; \
+	fi
+ctags: CTAGS
+CTAGS: ctags-recursive $(HEADERS) $(SOURCES) config.h.in $(TAGS_DEPENDENCIES) \
+		$(TAGS_FILES) $(LISP)
+	tags=; \
+	list='$(SOURCES) $(HEADERS) config.h.in $(LISP) $(TAGS_FILES)'; \
+	unique=`for i in $$list; do \
+	    if test -f "$$i"; then echo $$i; else echo $(srcdir)/$$i; fi; \
+	  done | \
+	  $(AWK) '{ files[$$0] = 1; nonempty = 1; } \
+	      END { if (nonempty) { for (i in files) print i; }; }'`; \
+	test -z "$(CTAGS_ARGS)$$tags$$unique" \
+	  || $(CTAGS) $(CTAGSFLAGS) $(AM_CTAGSFLAGS) $(CTAGS_ARGS) \
+	     $$tags $$unique
+
+GTAGS:
+	here=`$(am__cd) $(top_builddir) && pwd` \
+	  && cd $(top_srcdir) \
+	  && gtags -i $(GTAGS_ARGS) $$here
+
+distclean-tags:
+	-rm -f TAGS ID GTAGS GRTAGS GSYMS GPATH tags
+
+distdir: $(DISTFILES)
+	$(am__remove_distdir)
+	test -d $(distdir) || mkdir $(distdir)
+	@srcdirstrip=`echo "$(srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
+	topsrcdirstrip=`echo "$(top_srcdir)" | sed 's/[].[^$$\\*]/\\\\&/g'`; \
+	list='$(DISTFILES)'; \
+	  dist_files=`for file in $$list; do echo $$file; done | \
+	  sed -e "s|^$$srcdirstrip/||;t" \
+	      -e "s|^$$topsrcdirstrip/|$(top_builddir)/|;t"`; \
+	case $$dist_files in \
+	  */*) $(MKDIR_P) `echo "$$dist_files" | \
+			   sed '/\//!d;s|^|$(distdir)/|;s,/[^/]*$$,,' | \
+			   sort -u` ;; \
+	esac; \
+	for file in $$dist_files; do \
+	  if test -f $$file || test -d $$file; then d=.; else d=$(srcdir); fi; \
+	  if test -d $$d/$$file; then \
+	    dir=`echo "/$$file" | sed -e 's,/[^/]*$$,,'`; \
+	    if test -d $(srcdir)/$$file && test $$d != $(srcdir); then \
+	      cp -pR $(srcdir)/$$file $(distdir)$$dir || exit 1; \
+	    fi; \
+	    cp -pR $$d/$$file $(distdir)$$dir || exit 1; \
+	  else \
+	    test -f $(distdir)/$$file \
+	    || cp -p $$d/$$file $(distdir)/$$file \
+	    || exit 1; \
+	  fi; \
+	done
+	list='$(DIST_SUBDIRS)'; for subdir in $$list; do \
+	  if test "$$subdir" = .; then :; else \
+	    test -d "$(distdir)/$$subdir" \
+	    || $(MKDIR_P) "$(distdir)/$$subdir" \
+	    || exit 1; \
+	    distdir=`$(am__cd) $(distdir) && pwd`; \
+	    top_distdir=`$(am__cd) $(top_distdir) && pwd`; \
+	    (cd $$subdir && \
+	      $(MAKE) $(AM_MAKEFLAGS) \
+	        top_distdir="$$top_distdir" \
+	        distdir="$$distdir/$$subdir" \
+		am__remove_distdir=: \
+		am__skip_length_check=: \
+	        distdir) \
+	      || exit 1; \
+	  fi; \
+	done
+	$(MAKE) $(AM_MAKEFLAGS) \
+	  top_distdir="$(top_distdir)" distdir="$(distdir)" \
+	  dist-hook
+	-find $(distdir) -type d ! -perm -777 -exec chmod a+rwx {} \; -o \
+	  ! -type d ! -perm -444 -links 1 -exec chmod a+r {} \; -o \
+	  ! -type d ! -perm -400 -exec chmod a+r {} \; -o \
+	  ! -type d ! -perm -444 -exec $(install_sh) -c -m a+r {} {} \; \
+	|| chmod -R a+r $(distdir)
+dist-gzip: distdir
+	tardir=$(distdir) && $(am__tar) | GZIP=$(GZIP_ENV) gzip -c >$(distdir).tar.gz
+	$(am__remove_distdir)
+
+dist-bzip2: distdir
+	tardir=$(distdir) && $(am__tar) | bzip2 -9 -c >$(distdir).tar.bz2
+	$(am__remove_distdir)
+
+dist-lzma: distdir
+	tardir=$(distdir) && $(am__tar) | lzma -9 -c >$(distdir).tar.lzma
+	$(am__remove_distdir)
+
+dist-tarZ: distdir
+	tardir=$(distdir) && $(am__tar) | compress -c >$(distdir).tar.Z
+	$(am__remove_distdir)
+
+dist-shar: distdir
+	shar $(distdir) | GZIP=$(GZIP_ENV) gzip -c >$(distdir).shar.gz
+	$(am__remove_distdir)
+
+dist-zip: distdir
+	-rm -f $(distdir).zip
+	zip -rq $(distdir).zip $(distdir)
+	$(am__remove_distdir)
+
+dist dist-all: distdir
+	tardir=$(distdir) && $(am__tar) | GZIP=$(GZIP_ENV) gzip -c >$(distdir).tar.gz
+	$(am__remove_distdir)
+
+# This target untars the dist file and tries a VPATH configuration.  Then
+# it guarantees that the distribution is self-contained by making another
+# tarfile.
+distcheck: dist
+	case '$(DIST_ARCHIVES)' in \
+	*.tar.gz*) \
+	  GZIP=$(GZIP_ENV) gunzip -c $(distdir).tar.gz | $(am__untar) ;;\
+	*.tar.bz2*) \
+	  bunzip2 -c $(distdir).tar.bz2 | $(am__untar) ;;\
+	*.tar.lzma*) \
+	  unlzma -c $(distdir).tar.lzma | $(am__untar) ;;\
+	*.tar.Z*) \
+	  uncompress -c $(distdir).tar.Z | $(am__untar) ;;\
+	*.shar.gz*) \
+	  GZIP=$(GZIP_ENV) gunzip -c $(distdir).shar.gz | unshar ;;\
+	*.zip*) \
+	  unzip $(distdir).zip ;;\
+	esac
+	chmod -R a-w $(distdir); chmod a+w $(distdir)
+	mkdir $(distdir)/_build
+	mkdir $(distdir)/_inst
+	chmod a-w $(distdir)
+	dc_install_base=`$(am__cd) $(distdir)/_inst && pwd | sed -e 's,^[^:\\/]:[\\/],/,'` \
+	  && dc_destdir="$${TMPDIR-/tmp}/am-dc-$$$$/" \
+	  && cd $(distdir)/_build \
+	  && ../configure --srcdir=.. --prefix="$$dc_install_base" \
+	    $(DISTCHECK_CONFIGURE_FLAGS) \
+	  && $(MAKE) $(AM_MAKEFLAGS) \
+	  && $(MAKE) $(AM_MAKEFLAGS) dvi \
+	  && $(MAKE) $(AM_MAKEFLAGS) check \
+	  && $(MAKE) $(AM_MAKEFLAGS) install \
+	  && $(MAKE) $(AM_MAKEFLAGS) installcheck \
+	  && $(MAKE) $(AM_MAKEFLAGS) uninstall \
+	  && $(MAKE) $(AM_MAKEFLAGS) distuninstallcheck_dir="$$dc_install_base" \
+	        distuninstallcheck \
+	  && chmod -R a-w "$$dc_install_base" \
+	  && ({ \
+	       (cd ../.. && umask 077 && mkdir "$$dc_destdir") \
+	       && $(MAKE) $(AM_MAKEFLAGS) DESTDIR="$$dc_destdir" install \
+	       && $(MAKE) $(AM_MAKEFLAGS) DESTDIR="$$dc_destdir" uninstall \
+	       && $(MAKE) $(AM_MAKEFLAGS) DESTDIR="$$dc_destdir" \
+	            distuninstallcheck_dir="$$dc_destdir" distuninstallcheck; \
+	      } || { rm -rf "$$dc_destdir"; exit 1; }) \
+	  && rm -rf "$$dc_destdir" \
+	  && $(MAKE) $(AM_MAKEFLAGS) dist \
+	  && rm -rf $(DIST_ARCHIVES) \
+	  && $(MAKE) $(AM_MAKEFLAGS) distcleancheck
+	$(am__remove_distdir)
+	@(echo "$(distdir) archives ready for distribution: "; \
+	  list='$(DIST_ARCHIVES)'; for i in $$list; do echo $$i; done) | \
+	  sed -e 1h -e 1s/./=/g -e 1p -e 1x -e '$$p' -e '$$x'
+distuninstallcheck:
+	@cd $(distuninstallcheck_dir) \
+	&& test `$(distuninstallcheck_listfiles) | wc -l` -le 1 \
+	   || { echo "ERROR: files left after uninstall:" ; \
+	        if test -n "$(DESTDIR)"; then \
+	          echo "  (check DESTDIR support)"; \
+	        fi ; \
+	        $(distuninstallcheck_listfiles) ; \
+	        exit 1; } >&2
+distcleancheck: distclean
+	@if test '$(srcdir)' = . ; then \
+	  echo "ERROR: distcleancheck can only run from a VPATH build" ; \
+	  exit 1 ; \
+	fi
+	@test `$(distcleancheck_listfiles) | wc -l` -eq 0 \
+	  || { echo "ERROR: files left in build directory after distclean:" ; \
+	       $(distcleancheck_listfiles) ; \
+	       exit 1; } >&2
+check-am: all-am
+check: check-recursive
+all-am: Makefile $(SCRIPTS) $(DATA) config.h
+installdirs: installdirs-recursive
+installdirs-am:
+	for dir in "$(DESTDIR)$(mgizascriptsdir)" "$(DESTDIR)$(mgizadocdir)"; do \
+	  test -z "$$dir" || $(MKDIR_P) "$$dir"; \
+	done
+install: install-recursive
+install-exec: install-exec-recursive
+install-data: install-data-recursive
+uninstall: uninstall-recursive
+
+install-am: all-am
+	@$(MAKE) $(AM_MAKEFLAGS) install-exec-am install-data-am
+
+installcheck: installcheck-recursive
+install-strip:
+	$(MAKE) $(AM_MAKEFLAGS) INSTALL_PROGRAM="$(INSTALL_STRIP_PROGRAM)" \
+	  install_sh_PROGRAM="$(INSTALL_STRIP_PROGRAM)" INSTALL_STRIP_FLAG=-s \
+	  `test -z '$(STRIP)' || \
+	    echo "INSTALL_PROGRAM_ENV=STRIPPROG='$(STRIP)'"` install
+mostlyclean-generic:
+
+clean-generic:
+
+distclean-generic:
+	-test -z "$(CONFIG_CLEAN_FILES)" || rm -f $(CONFIG_CLEAN_FILES)
+
+maintainer-clean-generic:
+	@echo "This command is intended for maintainers to use"
+	@echo "it deletes files that may require special tools to rebuild."
+clean: clean-recursive
+
+clean-am: clean-generic mostlyclean-am
+
+distclean: distclean-recursive
+	-rm -f $(am__CONFIG_DISTCLEAN_FILES)
+	-rm -f Makefile
+distclean-am: clean-am distclean-generic distclean-hdr distclean-tags
+
+dvi: dvi-recursive
+
+dvi-am:
+
+html: html-recursive
+
+info: info-recursive
+
+info-am:
+
+install-data-am: install-mgizadocDATA install-mgizascriptsSCRIPTS
+
+install-dvi: install-dvi-recursive
+
+install-exec-am:
+
+install-html: install-html-recursive
+
+install-info: install-info-recursive
+
+install-man:
+
+install-pdf: install-pdf-recursive
+
+install-ps: install-ps-recursive
+
+installcheck-am:
+
+maintainer-clean: maintainer-clean-recursive
+	-rm -f $(am__CONFIG_DISTCLEAN_FILES)
+	-rm -rf $(top_srcdir)/autom4te.cache
+	-rm -f Makefile
+maintainer-clean-am: distclean-am maintainer-clean-generic
+
+mostlyclean: mostlyclean-recursive
+
+mostlyclean-am: mostlyclean-generic
+
+pdf: pdf-recursive
+
+pdf-am:
+
+ps: ps-recursive
+
+ps-am:
+
+uninstall-am: uninstall-mgizadocDATA uninstall-mgizascriptsSCRIPTS
+
+.MAKE: $(RECURSIVE_CLEAN_TARGETS) $(RECURSIVE_TARGETS) install-am \
+	install-strip
+
+.PHONY: $(RECURSIVE_CLEAN_TARGETS) $(RECURSIVE_TARGETS) CTAGS GTAGS \
+	all all-am am--refresh check check-am clean clean-generic \
+	ctags ctags-recursive dist dist-all dist-bzip2 dist-gzip \
+	dist-hook dist-lzma dist-shar dist-tarZ dist-zip distcheck \
+	distclean distclean-generic distclean-hdr distclean-tags \
+	distcleancheck distdir distuninstallcheck dvi dvi-am html \
+	html-am info info-am install install-am install-data \
+	install-data-am install-dvi install-dvi-am install-exec \
+	install-exec-am install-html install-html-am install-info \
+	install-info-am install-man install-mgizadocDATA \
+	install-mgizascriptsSCRIPTS install-pdf install-pdf-am \
+	install-ps install-ps-am install-strip installcheck \
+	installcheck-am installdirs installdirs-am maintainer-clean \
+	maintainer-clean-generic mostlyclean mostlyclean-generic pdf \
+	pdf-am ps ps-am tags tags-recursive uninstall uninstall-am \
+	uninstall-mgizadocDATA uninstall-mgizascriptsSCRIPTS
+
+# Copy all the spec files. Of course, only one is actually used.
+# The glob stays literal when no *.spec file exists, hence the `test -f'.
+# Abort the distribution if any copy fails instead of silently continuing.
+dist-hook:
+	for specfile in *.spec; do \
+		if test -f "$$specfile"; then \
+			cp -p "$$specfile" $(distdir) || exit 1; \
+		fi; \
+	done
+# Tell versions [3.59,3.63) of GNU make to not export all variables.
+# Otherwise a system limit (for SysV at least) may be exceeded.
+.NOEXPORT:
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/NEWS
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/NEWS
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/README
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/README
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/TODO.tasks
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/TODO.tasks
@ -0,0 +1,6 @@
+<?xml version="1.0"?>
+<gtodo>
+  <category title="Personal" place="0"/>
+  <category title="Business" place="1"/>
+  <category title="Unfiled" place="2"/>
+</gtodo>
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/aclocal.m4
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/aclocal.m4
@ -0,0 +1,932 @@
+# generated automatically by aclocal 1.10.1 -*- Autoconf -*-
+
+# Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
+# 2005, 2006, 2007, 2008  Free Software Foundation, Inc.
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY, to the extent permitted by law; without
+# even the implied warranty of MERCHANTABILITY or FITNESS FOR A
+# PARTICULAR PURPOSE.
+
+m4_ifndef([AC_AUTOCONF_VERSION],
+  [m4_copy([m4_PACKAGE_VERSION], [AC_AUTOCONF_VERSION])])dnl
+m4_if(AC_AUTOCONF_VERSION, [2.62],,
+[m4_warning([this file was generated for autoconf 2.62.
+You have another version of autoconf.  It may work, but is not guaranteed to.
+If you have problems, you may need to regenerate the build system entirely.
+To do so, use the procedure documented by the package, typically `autoreconf'.])])
+
+# Copyright (C) 2002, 2003, 2005, 2006, 2007  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# AM_AUTOMAKE_VERSION(VERSION)
+# ----------------------------
+# Automake X.Y traces this macro to ensure aclocal.m4 has been
+# generated from the m4 files accompanying Automake X.Y.
+# (This private macro should not be called outside this file.)
+AC_DEFUN([AM_AUTOMAKE_VERSION],
+[am__api_version='1.10'
+dnl Some users find AM_AUTOMAKE_VERSION and mistake it for a way to
+dnl require some minimum version.  Point them to the right macro.
+m4_if([$1], [1.10.1], [],
+      [AC_FATAL([Do not call $0, use AM_INIT_AUTOMAKE([$1]).])])dnl
+])
+
+# _AM_AUTOCONF_VERSION(VERSION)
+# -----------------------------
+# aclocal traces this macro to find the Autoconf version.
+# This is a private macro too.  Using m4_define simplifies
+# the logic in aclocal, which can simply ignore this definition.
+m4_define([_AM_AUTOCONF_VERSION], [])
+
+# AM_SET_CURRENT_AUTOMAKE_VERSION
+# -------------------------------
+# Call AM_AUTOMAKE_VERSION and _AM_AUTOCONF_VERSION so they can be traced.
+# This function is AC_REQUIREd by AM_INIT_AUTOMAKE.
+AC_DEFUN([AM_SET_CURRENT_AUTOMAKE_VERSION],
+[AM_AUTOMAKE_VERSION([1.10.1])dnl
+m4_ifndef([AC_AUTOCONF_VERSION],
+  [m4_copy([m4_PACKAGE_VERSION], [AC_AUTOCONF_VERSION])])dnl
+_AM_AUTOCONF_VERSION(AC_AUTOCONF_VERSION)])
+
+# AM_AUX_DIR_EXPAND                                         -*- Autoconf -*-
+
+# Copyright (C) 2001, 2003, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# For projects using AC_CONFIG_AUX_DIR([foo]), Autoconf sets
+# $ac_aux_dir to `$srcdir/foo'.  In other projects, it is set to
+# `$srcdir', `$srcdir/..', or `$srcdir/../..'.
+#
+# Of course, Automake must honor this variable whenever it calls a
+# tool from the auxiliary directory.  The problem is that $srcdir (and
+# therefore $ac_aux_dir as well) can be either absolute or relative,
+# depending on how configure is run.  This is pretty annoying, since
+# it makes $ac_aux_dir quite unusable in subdirectories: in the top
+# source directory, any form will work fine, but in subdirectories a
+# relative path needs to be adjusted first.
+#
+# $ac_aux_dir/missing
+#    fails when called from a subdirectory if $ac_aux_dir is relative
+# $top_srcdir/$ac_aux_dir/missing
+#    fails if $ac_aux_dir is absolute,
+#    fails when called from a subdirectory in a VPATH build with
+#          a relative $ac_aux_dir
+#
+# The reason of the latter failure is that $top_srcdir and $ac_aux_dir
+# are both prefixed by $srcdir.  In an in-source build this is usually
+# harmless because $srcdir is `.', but things will break when you
+# start a VPATH build or use an absolute $srcdir.
+#
+# So we could use something similar to $top_srcdir/$ac_aux_dir/missing,
+# iff we strip the leading $srcdir from $ac_aux_dir.  That would be:
+#   am_aux_dir='\$(top_srcdir)/'`expr "$ac_aux_dir" : "$srcdir//*\(.*\)"`
+# and then we would define $MISSING as
+#   MISSING="\${SHELL} $am_aux_dir/missing"
+# This will work as long as MISSING is not called from configure, because
+# unfortunately $(top_srcdir) has no meaning in configure.
+# However there are other variables, like CC, which are often used in
+# configure, and could therefore not use this "fixed" $ac_aux_dir.
+#
+# Another solution, used here, is to always expand $ac_aux_dir to an
+# absolute PATH.  The drawback is that using absolute paths prevents a
+# configured tree from being moved without reconfiguration.
+
+AC_DEFUN([AM_AUX_DIR_EXPAND],
+[dnl Rely on autoconf to set up CDPATH properly.
+AC_PREREQ([2.50])dnl
+# expand $ac_aux_dir to an absolute path
+am_aux_dir=`cd $ac_aux_dir && pwd`
+])
+
+
+# Copyright (C) 1996, 1997, 1999, 2000, 2001, 2002, 2003, 2005
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 4
+
+# This was merged into AC_PROG_CC in Autoconf.
+
+AU_DEFUN([AM_PROG_CC_STDC],
+[AC_PROG_CC
+AC_DIAGNOSE([obsolete], [$0:
+	your code should no longer depend upon `am_cv_prog_cc_stdc', but upon
+	`ac_cv_prog_cc_stdc'.  Remove this warning and the assignment when
+	you adjust the code.  You can also remove the above call to
+	AC_PROG_CC if you already called it elsewhere.])
+am_cv_prog_cc_stdc=$ac_cv_prog_cc_stdc
+])
+AU_DEFUN([fp_PROG_CC_STDC])
+
+# AM_CONDITIONAL                                            -*- Autoconf -*-
+
+# Copyright (C) 1997, 2000, 2001, 2003, 2004, 2005, 2006
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 8
+
+# AM_CONDITIONAL(NAME, SHELL-CONDITION)
+# -------------------------------------
+# Define a conditional.
+AC_DEFUN([AM_CONDITIONAL],
+[AC_PREREQ(2.52)dnl
+ ifelse([$1], [TRUE],  [AC_FATAL([$0: invalid condition: $1])],
+	[$1], [FALSE], [AC_FATAL([$0: invalid condition: $1])])dnl
+AC_SUBST([$1_TRUE])dnl
+AC_SUBST([$1_FALSE])dnl
+_AM_SUBST_NOTMAKE([$1_TRUE])dnl
+_AM_SUBST_NOTMAKE([$1_FALSE])dnl
+if $2; then
+  $1_TRUE=
+  $1_FALSE='#'
+else
+  $1_TRUE='#'
+  $1_FALSE=
+fi
+AC_CONFIG_COMMANDS_PRE(
+[if test -z "${$1_TRUE}" && test -z "${$1_FALSE}"; then
+  AC_MSG_ERROR([[conditional "$1" was never defined.
+Usually this means the macro was only invoked conditionally.]])
+fi])])
+
+# Copyright (C) 1999, 2000, 2001, 2002, 2003, 2004, 2005, 2006
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 9
+
+# There are a few dirty hacks below to avoid letting `AC_PROG_CC' be
+# written in clear, in which case automake, when reading aclocal.m4,
+# will think it sees a *use*, and therefore will trigger all its
+# C support machinery.  Also note that it means that autoscan, seeing
+# CC etc. in the Makefile, will ask for an AC_PROG_CC use...
+
+
+# _AM_DEPENDENCIES(NAME)
+# ----------------------
+# See how the compiler implements dependency checking.
+# NAME is "CC", "CXX", "GCJ", or "OBJC".
+# We try a few techniques and use that to set a single cache variable.
+#
+# We don't AC_REQUIRE the corresponding AC_PROG_CC since the latter was
+# modified to invoke _AM_DEPENDENCIES(CC); we would have a circular
+# dependency, and given that the user is not expected to run this macro,
+# just rely on AC_PROG_CC.
+AC_DEFUN([_AM_DEPENDENCIES],
+[AC_REQUIRE([AM_SET_DEPDIR])dnl
+AC_REQUIRE([AM_OUTPUT_DEPENDENCY_COMMANDS])dnl
+AC_REQUIRE([AM_MAKE_INCLUDE])dnl
+AC_REQUIRE([AM_DEP_TRACK])dnl
+
+ifelse([$1], CC,   [depcc="$CC"   am_compiler_list=],
+       [$1], CXX,  [depcc="$CXX"  am_compiler_list=],
+       [$1], OBJC, [depcc="$OBJC" am_compiler_list='gcc3 gcc'],
+       [$1], UPC,  [depcc="$UPC"  am_compiler_list=],
+       [$1], GCJ,  [depcc="$GCJ"  am_compiler_list='gcc3 gcc'],
+                   [depcc="$$1"   am_compiler_list=])
+
+AC_CACHE_CHECK([dependency style of $depcc],
+               [am_cv_$1_dependencies_compiler_type],
+[if test -z "$AMDEP_TRUE" && test -f "$am_depcomp"; then
+  # We make a subdir and do the tests there.  Otherwise we can end up
+  # making bogus files that we don't know about and never remove.  For
+  # instance it was reported that on HP-UX the gcc test will end up
+  # making a dummy file named `D' -- because `-MD' means `put the output
+  # in D'.
+  mkdir conftest.dir
+  # Copy depcomp to subdir because otherwise we won't find it if we're
+  # using a relative directory.
+  cp "$am_depcomp" conftest.dir
+  cd conftest.dir
+  # We will build objects and dependencies in a subdirectory because
+  # it helps to detect inapplicable dependency modes.  For instance
+  # both Tru64's cc and ICC support -MD to output dependencies as a
+  # side effect of compilation, but ICC will put the dependencies in
+  # the current directory while Tru64 will put them in the object
+  # directory.
+  mkdir sub
+
+  am_cv_$1_dependencies_compiler_type=none
+  if test "$am_compiler_list" = ""; then
+     am_compiler_list=`sed -n ['s/^#*\([a-zA-Z0-9]*\))$/\1/p'] < ./depcomp`
+  fi
+  for depmode in $am_compiler_list; do
+    # Setup a source with many dependencies, because some compilers
+    # like to wrap large dependency lists on column 80 (with \), and
+    # we should not choose a depcomp mode which is confused by this.
+    #
+    # We need to recreate these files for each test, as the compiler may
+    # overwrite some of them when testing with obscure command lines.
+    # This happens at least with the AIX C compiler.
+    : > sub/conftest.c
+    for i in 1 2 3 4 5 6; do
+      echo '#include "conftst'$i'.h"' >> sub/conftest.c
+      # Using `: > sub/conftst$i.h' creates only sub/conftst1.h with
+      # Solaris 8's {/usr,}/bin/sh.
+      touch sub/conftst$i.h
+    done
+    echo "${am__include} ${am__quote}sub/conftest.Po${am__quote}" > confmf
+
+    case $depmode in
+    nosideeffect)
+      # after this tag, mechanisms are not by side-effect, so they'll
+      # only be used when explicitly requested
+      if test "x$enable_dependency_tracking" = xyes; then
+	continue
+      else
+	break
+      fi
+      ;;
+    none) break ;;
+    esac
+    # We check with `-c' and `-o' for the sake of the "dashmstdout"
+    # mode.  It turns out that the SunPro C++ compiler does not properly
+    # handle `-M -o', and we need to detect this.
+    if depmode=$depmode \
+       source=sub/conftest.c object=sub/conftest.${OBJEXT-o} \
+       depfile=sub/conftest.Po tmpdepfile=sub/conftest.TPo \
+       $SHELL ./depcomp $depcc -c -o sub/conftest.${OBJEXT-o} sub/conftest.c \
+         >/dev/null 2>conftest.err &&
+       grep sub/conftst1.h sub/conftest.Po > /dev/null 2>&1 &&
+       grep sub/conftst6.h sub/conftest.Po > /dev/null 2>&1 &&
+       grep sub/conftest.${OBJEXT-o} sub/conftest.Po > /dev/null 2>&1 &&
+       ${MAKE-make} -s -f confmf > /dev/null 2>&1; then
+      # icc doesn't choke on unknown options, it will just issue warnings
+      # or remarks (even with -Werror).  So we grep stderr for any message
+      # that says an option was ignored or not supported.
+      # When given -MP, icc 7.0 and 7.1 complain thusly:
+      #   icc: Command line warning: ignoring option '-M'; no argument required
+      # The diagnosis changed in icc 8.0:
+      #   icc: Command line remark: option '-MP' not supported
+      if (grep 'ignoring option' conftest.err ||
+          grep 'not supported' conftest.err) >/dev/null 2>&1; then :; else
+        am_cv_$1_dependencies_compiler_type=$depmode
+        break
+      fi
+    fi
+  done
+
+  cd ..
+  rm -rf conftest.dir
+else
+  am_cv_$1_dependencies_compiler_type=none
+fi
+])
+AC_SUBST([$1DEPMODE], [depmode=$am_cv_$1_dependencies_compiler_type])
+AM_CONDITIONAL([am__fastdep$1], [
+  test "x$enable_dependency_tracking" != xno \
+  && test "$am_cv_$1_dependencies_compiler_type" = gcc3])
+])
+
+
+# AM_SET_DEPDIR
+# -------------
+# Choose a directory name for dependency files.
+# This macro is AC_REQUIREd in _AM_DEPENDENCIES
+AC_DEFUN([AM_SET_DEPDIR],
+[AC_REQUIRE([AM_SET_LEADING_DOT])dnl
+AC_SUBST([DEPDIR], ["${am__leading_dot}deps"])dnl
+])
+
+
+# AM_DEP_TRACK
+# ------------
+AC_DEFUN([AM_DEP_TRACK],
+[AC_ARG_ENABLE(dependency-tracking,
+[  --disable-dependency-tracking  speeds up one-time build
+  --enable-dependency-tracking   do not reject slow dependency extractors])
+if test "x$enable_dependency_tracking" != xno; then
+  am_depcomp="$ac_aux_dir/depcomp"
+  AMDEPBACKSLASH='\'
+fi
+AM_CONDITIONAL([AMDEP], [test "x$enable_dependency_tracking" != xno])
+AC_SUBST([AMDEPBACKSLASH])dnl
+_AM_SUBST_NOTMAKE([AMDEPBACKSLASH])dnl
+])
+
+# Generate code to set up dependency tracking.              -*- Autoconf -*-
+
+# Copyright (C) 1999, 2000, 2001, 2002, 2003, 2004, 2005
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+#serial 3
+
+# _AM_OUTPUT_DEPENDENCY_COMMANDS
+# ------------------------------
+AC_DEFUN([_AM_OUTPUT_DEPENDENCY_COMMANDS],
+[for mf in $CONFIG_FILES; do
+  # Strip MF so we end up with the name of the file.
+  mf=`echo "$mf" | sed -e 's/:.*$//'`
+  # Check whether this is an Automake generated Makefile or not.
+  # We used to match only the files named `Makefile.in', but
+  # some people rename them; so instead we look at the file content.
+  # Grep'ing the first line is not enough: some people post-process
+  # each Makefile.in and add a new line on top of each file to say so.
+  # Grep'ing the whole file is not good either: AIX grep has a line
+  # limit of 2048, but all seds we know understand at least 4000.
+  if sed -n 's,^#.*generated by automake.*,X,p' "$mf" | grep X >/dev/null 2>&1; then
+    dirpart=`AS_DIRNAME("$mf")`
+  else
+    continue
+  fi
+  # Extract the definition of DEPDIR, am__include, and am__quote
+  # from the Makefile without running `make'.
+  DEPDIR=`sed -n 's/^DEPDIR = //p' < "$mf"`
+  test -z "$DEPDIR" && continue
+  am__include=`sed -n 's/^am__include = //p' < "$mf"`
+  test -z "$am__include" && continue
+  am__quote=`sed -n 's/^am__quote = //p' < "$mf"`
+  # When using ansi2knr, U may be empty or an underscore; expand it
+  U=`sed -n 's/^U = //p' < "$mf"`
+  # Find all dependency output files, they are included files with
+  # $(DEPDIR) in their names.  We invoke sed twice because it is the
+  # simplest approach to changing $(DEPDIR) to its actual value in the
+  # expansion.
+  for file in `sed -n "
+    s/^$am__include $am__quote\(.*(DEPDIR).*\)$am__quote"'$/\1/p' <"$mf" | \
+       sed -e 's/\$(DEPDIR)/'"$DEPDIR"'/g' -e 's/\$U/'"$U"'/g'`; do
+    # Make sure the directory exists.
+    test -f "$dirpart/$file" && continue
+    fdir=`AS_DIRNAME(["$file"])`
+    AS_MKDIR_P([$dirpart/$fdir])
+    # echo "creating $dirpart/$file"
+    echo '# dummy' > "$dirpart/$file"
+  done
+done
+])# _AM_OUTPUT_DEPENDENCY_COMMANDS
+
+
+# AM_OUTPUT_DEPENDENCY_COMMANDS
+# -----------------------------
+# This macro should only be invoked once -- use via AC_REQUIRE.
+#
+# This code is only required when automatic dependency tracking
+# is enabled.  FIXME.  This creates each `.P' file that we will
+# need in order to bootstrap the dependency handling code.
+AC_DEFUN([AM_OUTPUT_DEPENDENCY_COMMANDS],
+[AC_CONFIG_COMMANDS([depfiles],
+     [test x"$AMDEP_TRUE" != x"" || _AM_OUTPUT_DEPENDENCY_COMMANDS],
+     [AMDEP_TRUE="$AMDEP_TRUE" ac_aux_dir="$ac_aux_dir"])
+])
+
+# Copyright (C) 1996, 1997, 2000, 2001, 2003, 2005
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 8
+
+# AM_CONFIG_HEADER is obsolete.  It has been replaced by AC_CONFIG_HEADERS.
+AU_DEFUN([AM_CONFIG_HEADER], [AC_CONFIG_HEADERS($@)])
+
+# Do all the work for Automake.                             -*- Autoconf -*-
+
+# Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
+# 2005, 2006, 2008 Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 13
+
+# This macro actually does too much.  Some checks are only needed if
+# your package does certain things.  But this isn't really a big deal.
+
+# AM_INIT_AUTOMAKE(PACKAGE, VERSION, [NO-DEFINE])
+# AM_INIT_AUTOMAKE([OPTIONS])
+# -----------------------------------------------
+# The call with PACKAGE and VERSION arguments is the old style
+# call (pre autoconf-2.50), which is being phased out.  PACKAGE
+# and VERSION should now be passed to AC_INIT and removed from
+# the call to AM_INIT_AUTOMAKE.
+# We support both call styles for the transition.  After
+# the next Automake release, Autoconf can make the AC_INIT
+# arguments mandatory, and then we can depend on a new Autoconf
+# release and drop the old call support.
+AC_DEFUN([AM_INIT_AUTOMAKE],
+[AC_PREREQ([2.60])dnl
+dnl Autoconf wants to disallow AM_ names.  We explicitly allow
+dnl the ones we care about.
+m4_pattern_allow([^AM_[A-Z]+FLAGS$])dnl
+AC_REQUIRE([AM_SET_CURRENT_AUTOMAKE_VERSION])dnl
+AC_REQUIRE([AC_PROG_INSTALL])dnl
+if test "`cd $srcdir && pwd`" != "`pwd`"; then
+  # Use -I$(srcdir) only when $(srcdir) != ., so that make's output
+  # is not polluted with repeated "-I."
+  AC_SUBST([am__isrc], [' -I$(srcdir)'])_AM_SUBST_NOTMAKE([am__isrc])dnl
+  # test to see if srcdir already configured
+  if test -f $srcdir/config.status; then
+    AC_MSG_ERROR([source directory already configured; run "make distclean" there first])
+  fi
+fi
+
+# test whether we have cygpath
+if test -z "$CYGPATH_W"; then
+  if (cygpath --version) >/dev/null 2>/dev/null; then
+    CYGPATH_W='cygpath -w'
+  else
+    CYGPATH_W=echo
+  fi
+fi
+AC_SUBST([CYGPATH_W])
+
+# Define the identity of the package.
+dnl Distinguish between old-style and new-style calls.
+m4_ifval([$2],
+[m4_ifval([$3], [_AM_SET_OPTION([no-define])])dnl
+ AC_SUBST([PACKAGE], [$1])dnl
+ AC_SUBST([VERSION], [$2])],
+[_AM_SET_OPTIONS([$1])dnl
+dnl Diagnose old-style AC_INIT with new-style AM_INIT_AUTOMAKE.
+m4_if(m4_ifdef([AC_PACKAGE_NAME], 1)m4_ifdef([AC_PACKAGE_VERSION], 1), 11,,
+  [m4_fatal([AC_INIT should be called with package and version arguments])])dnl
+ AC_SUBST([PACKAGE], ['AC_PACKAGE_TARNAME'])dnl
+ AC_SUBST([VERSION], ['AC_PACKAGE_VERSION'])])dnl
+
+_AM_IF_OPTION([no-define],,
+[AC_DEFINE_UNQUOTED(PACKAGE, "$PACKAGE", [Name of package])
+ AC_DEFINE_UNQUOTED(VERSION, "$VERSION", [Version number of package])])dnl
+
+# Some tools Automake needs.
+AC_REQUIRE([AM_SANITY_CHECK])dnl
+AC_REQUIRE([AC_ARG_PROGRAM])dnl
+AM_MISSING_PROG(ACLOCAL, aclocal-${am__api_version})
+AM_MISSING_PROG(AUTOCONF, autoconf)
+AM_MISSING_PROG(AUTOMAKE, automake-${am__api_version})
+AM_MISSING_PROG(AUTOHEADER, autoheader)
+AM_MISSING_PROG(MAKEINFO, makeinfo)
+AM_PROG_INSTALL_SH
+AM_PROG_INSTALL_STRIP
+AC_REQUIRE([AM_PROG_MKDIR_P])dnl
+# We need awk for the "check" target.  The system "awk" is bad on
+# some platforms.
+AC_REQUIRE([AC_PROG_AWK])dnl
+AC_REQUIRE([AC_PROG_MAKE_SET])dnl
+AC_REQUIRE([AM_SET_LEADING_DOT])dnl
+_AM_IF_OPTION([tar-ustar], [_AM_PROG_TAR([ustar])],
+              [_AM_IF_OPTION([tar-pax], [_AM_PROG_TAR([pax])],
+	      		     [_AM_PROG_TAR([v7])])])
+_AM_IF_OPTION([no-dependencies],,
+[AC_PROVIDE_IFELSE([AC_PROG_CC],
+                  [_AM_DEPENDENCIES(CC)],
+                  [define([AC_PROG_CC],
+                          defn([AC_PROG_CC])[_AM_DEPENDENCIES(CC)])])dnl
+AC_PROVIDE_IFELSE([AC_PROG_CXX],
+                  [_AM_DEPENDENCIES(CXX)],
+                  [define([AC_PROG_CXX],
+                          defn([AC_PROG_CXX])[_AM_DEPENDENCIES(CXX)])])dnl
+AC_PROVIDE_IFELSE([AC_PROG_OBJC],
+                  [_AM_DEPENDENCIES(OBJC)],
+                  [define([AC_PROG_OBJC],
+                          defn([AC_PROG_OBJC])[_AM_DEPENDENCIES(OBJC)])])dnl
+])
+])
+
+
+# When config.status generates a header, we must update the stamp-h file.
+# This file resides in the same directory as the config header
+# that is generated.  The stamp files are numbered to have different names.
+
+# Autoconf calls _AC_AM_CONFIG_HEADER_HOOK (when defined) in the
+# loop where config.status creates the headers, so we can generate
+# our stamp files there.
+AC_DEFUN([_AC_AM_CONFIG_HEADER_HOOK],
+[# Compute $1's index in $config_headers.
+_am_arg=$1
+_am_stamp_count=1
+for _am_header in $config_headers :; do
+  case $_am_header in
+    $_am_arg | $_am_arg:* )
+      break ;;
+    * )
+      _am_stamp_count=`expr $_am_stamp_count + 1` ;;
+  esac
+done
+echo "timestamp for $_am_arg" >`AS_DIRNAME(["$_am_arg"])`/stamp-h[]$_am_stamp_count])
+
+# Copyright (C) 2001, 2003, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# AM_PROG_INSTALL_SH
+# ------------------
+# Define $install_sh.
+# A value of install_sh that is already set is kept as is.  Otherwise
+# the default is `$(SHELL) $am_aux_dir/install-sh': the dollar of
+# $(SHELL) is escaped so the shell leaves it alone, while $am_aux_dir
+# is expanded immediately.  AM_AUX_DIR_EXPAND is required beforehand,
+# presumably because it sets $am_aux_dir (it is defined outside this
+# part of the file).  The variable is then handed to AC_SUBST.
+AC_DEFUN([AM_PROG_INSTALL_SH],
+[AC_REQUIRE([AM_AUX_DIR_EXPAND])dnl
+install_sh=${install_sh-"\$(SHELL) $am_aux_dir/install-sh"}
+AC_SUBST(install_sh)])
+
+# Copyright (C) 2003, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 2
+
+# Check whether the underlying file-system supports filenames
+# with a leading dot.  For instance MS-DOS doesn't.
+#
+# AM_SET_LEADING_DOT
+# ------------------
+# Tries to create a scratch directory named `.tst' in the current
+# directory (removing any leftover one first).  If the directory exists
+# afterwards, am__leading_dot is set to `.', otherwise to `_'.  The
+# scratch directory is removed again and am__leading_dot is AC_SUBSTed.
+AC_DEFUN([AM_SET_LEADING_DOT],
+[rm -rf .tst 2>/dev/null
+mkdir .tst 2>/dev/null
+if test -d .tst; then
+  am__leading_dot=.
+else
+  am__leading_dot=_
+fi
+rmdir .tst 2>/dev/null
+AC_SUBST([am__leading_dot])])
+
+# Add --enable-maintainer-mode option to configure.         -*- Autoconf -*-
+# From Jim Meyering
+
+# Copyright (C) 1996, 1998, 2000, 2001, 2002, 2003, 2004, 2005
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 4
+
+# AM_MAINTAINER_MODE
+# ------------------
+# Adds the configure option --enable-maintainer-mode.  When the option
+# is not given, USE_MAINTAINER_MODE is `no'; when it is given, the
+# variable takes the option's value.  The result is reported on the
+# "checking" line, the Automake conditional MAINTAINER_MODE is true
+# exactly when the value is `yes', and MAINT is substituted with the
+# value of $MAINTAINER_MODE_TRUE (presumably set by the AM_CONDITIONAL
+# call just before it -- confirm against AM_CONDITIONAL).
+AC_DEFUN([AM_MAINTAINER_MODE],
+[AC_MSG_CHECKING([whether to enable maintainer-specific portions of Makefiles])
+  dnl maintainer-mode is disabled by default
+  AC_ARG_ENABLE(maintainer-mode,
+[  --enable-maintainer-mode  enable make rules and dependencies not useful
+			  (and sometimes confusing) to the casual installer],
+      USE_MAINTAINER_MODE=$enableval,
+      USE_MAINTAINER_MODE=no)
+  AC_MSG_RESULT([$USE_MAINTAINER_MODE])
+  AM_CONDITIONAL(MAINTAINER_MODE, [test $USE_MAINTAINER_MODE = yes])
+  MAINT=$MAINTAINER_MODE_TRUE
+  AC_SUBST(MAINT)dnl
+]
+)
+
+# Older spelling of the macro, declared with AU_DEFUN so that it
+# expands to AM_MAINTAINER_MODE.
+AU_DEFUN([jm_MAINTAINER_MODE], [AM_MAINTAINER_MODE])
+
+# Check to see how 'make' treats includes.	            -*- Autoconf -*-
+
+# Copyright (C) 2001, 2002, 2003, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 3
+
+# AM_MAKE_INCLUDE()
+# -----------------
+# Check to see how make treats includes.
+#
+# A tiny makefile fragment `confinc' with one target that prints
+# `done' is written, and then included from a second file `confmf'
+# using each candidate syntax in turn.  The outcome is stored in two
+# substituted variables:
+#   GNU style:   am__include=include    am__quote=   (empty)
+#   BSD style:   am__include=.include   am__quote="  (a double quote)
+#   neither:     am__include=#          am__quote=   (empty)
+# The make program tried is $MAKE, or `make' when MAKE is unset.
+# Both scratch files are removed at the end.
+AC_DEFUN([AM_MAKE_INCLUDE],
+[am_make=${MAKE-make}
+cat > confinc << 'END'
+am__doit:
+	@echo done
+.PHONY: am__doit
+END
+# If we don't find an include directive, just comment out the code.
+AC_MSG_CHECKING([for style of include used by $am_make])
+am__include="#"
+am__quote=
+_am_result=none
+# First try GNU make style include.
+echo "include confinc" > confmf
+# We grep out `Entering directory' and `Leaving directory'
+# messages which can occur if `w' ends up in MAKEFLAGS.
+# In particular we don't look at `^make:' because GNU make might
+# be invoked under some other name (usually "gmake"), in which
+# case it prints its new name instead of `make'.
+if test "`$am_make -s -f confmf 2> /dev/null | grep -v 'ing directory'`" = "done"; then
+   am__include=include
+   am__quote=
+   _am_result=GNU
+fi
+# Now try BSD make style include.
+if test "$am__include" = "#"; then
+   echo '.include "confinc"' > confmf
+   if test "`$am_make -s -f confmf 2> /dev/null`" = "done"; then
+      am__include=.include
+      am__quote="\""
+      _am_result=BSD
+   fi
+fi
+AC_SUBST([am__include])
+AC_SUBST([am__quote])
+AC_MSG_RESULT([$_am_result])
+rm -f confinc confmf
+])
+
+# Fake the existence of programs that GNU maintainers use.  -*- Autoconf -*-
+
+# Copyright (C) 1997, 1999, 2000, 2001, 2003, 2004, 2005
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 5
+
+# AM_MISSING_PROG(NAME, PROGRAM)
+# ------------------------------
+# Give the shell variable NAME the default value
+# "${am_missing_run}PROGRAM" unless NAME is already set, then pass
+# NAME to AC_SUBST.  AM_MISSING_HAS_RUN is required first because it is
+# the macro that sets am_missing_run.
+AC_DEFUN([AM_MISSING_PROG],
+[AC_REQUIRE([AM_MISSING_HAS_RUN])
+$1=${$1-"${am_missing_run}$2"}
+AC_SUBST($1)])
+
+
+# AM_MISSING_HAS_RUN
+# ------------------
+# Define MISSING if not defined so far and test if it supports --run.
+# If it does, set am_missing_run to use it, otherwise, to nothing.
+#
+# MISSING counts as defined even when it is set to the empty string
+# (the test uses the `+set' form of parameter expansion).  Its default
+# is `${SHELL} $am_aux_dir/missing' with the dollar of ${SHELL} escaped,
+# which is why the probe goes through eval.  On success am_missing_run
+# is "$MISSING --run " including the trailing blank, so a program name
+# can be appended directly; on failure a warning is printed.
+AC_DEFUN([AM_MISSING_HAS_RUN],
+[AC_REQUIRE([AM_AUX_DIR_EXPAND])dnl
+AC_REQUIRE_AUX_FILE([missing])dnl
+test x"${MISSING+set}" = xset || MISSING="\${SHELL} $am_aux_dir/missing"
+# Use eval to expand $SHELL
+if eval "$MISSING --run true"; then
+  am_missing_run="$MISSING --run "
+else
+  am_missing_run=
+  AC_MSG_WARN([`missing' script is too old or missing])
+fi
+])
+
+# Copyright (C) 2003, 2004, 2005, 2006  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# AM_PROG_MKDIR_P
+# ---------------
+# Check for `mkdir -p'.
+#
+# The actual check is delegated to AC_PROG_MKDIR_P; this macro only
+# derives the legacy variable mkdir_p from $MKDIR_P.  The case
+# statement at the end leaves the value alone when it starts with a
+# slash, a backslash, a dollar sign or a drive prefix such as `C:/';
+# any other value that contains a slash gets `$(top_builddir)/' put in
+# front of it.  A value without any slash is left unchanged as well.
+AC_DEFUN([AM_PROG_MKDIR_P],
+[AC_PREREQ([2.60])dnl
+AC_REQUIRE([AC_PROG_MKDIR_P])dnl
+dnl Automake 1.8 to 1.9.6 used to define mkdir_p.  We now use MKDIR_P,
+dnl while keeping a definition of mkdir_p for backward compatibility.
+dnl @MKDIR_P@ is magic: AC_OUTPUT adjusts its value for each Makefile.
+dnl However we cannot define mkdir_p as $(MKDIR_P) for the sake of
+dnl Makefile.ins that do not define MKDIR_P, so we do our own
+dnl adjustment using top_builddir (which is defined more often than
+dnl MKDIR_P).
+AC_SUBST([mkdir_p], ["$MKDIR_P"])dnl
+case $mkdir_p in
+  [[\\/$]]* | ?:[[\\/]]*) ;;
+  */*) mkdir_p="\$(top_builddir)/$mkdir_p" ;;
+esac
+])
+
+# Helper functions for option handling.                     -*- Autoconf -*-
+
+# Copyright (C) 2001, 2002, 2003, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 3
+
+# _AM_MANGLE_OPTION(NAME)
+# -----------------------
+# Expand to the m4 macro name used as the flag for option NAME: the
+# prefix `_AM_OPTION_' followed by NAME with every character that is
+# not a letter, digit or underscore replaced by an underscore
+# (for example `tar-ustar' becomes `_AM_OPTION_tar_ustar').
+AC_DEFUN([_AM_MANGLE_OPTION],
+[[_AM_OPTION_]m4_bpatsubst($1, [[^a-zA-Z0-9_]], [_])])
+
+# _AM_SET_OPTION(NAME)
+# ------------------------------
+# Set option NAME.  Presently that only means defining a flag for this option.
+# The flag is the macro named by _AM_MANGLE_OPTION(NAME), defined to 1.
+AC_DEFUN([_AM_SET_OPTION],
+[m4_define(_AM_MANGLE_OPTION([$1]), 1)])
+
+# _AM_SET_OPTIONS(OPTIONS)
+# ----------------------------------
+# OPTIONS is a space-separated list of Automake options.
+# _AM_SET_OPTION is invoked once for every word of the list.
+AC_DEFUN([_AM_SET_OPTIONS],
+[AC_FOREACH([_AM_Option], [$1], [_AM_SET_OPTION(_AM_Option)])])
+
+# _AM_IF_OPTION(OPTION, IF-SET, [IF-NOT-SET])
+# -------------------------------------------
+# Execute IF-SET if OPTION is set, IF-NOT-SET otherwise.
+# "Set" is decided by m4_ifset on the flag macro that
+# _AM_MANGLE_OPTION(OPTION) names, i.e. the one _AM_SET_OPTION defines.
+AC_DEFUN([_AM_IF_OPTION],
+[m4_ifset(_AM_MANGLE_OPTION([$1]), [$2], [$3])])
+
+# Check to make sure that the build environment is sane.    -*- Autoconf -*-
+
+# Copyright (C) 1996, 1997, 2000, 2001, 2003, 2005
+# Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 4
+
+# AM_SANITY_CHECK
+# ---------------
+# Verify that a file created right now is reported by `ls -t' as newer
+# than $srcdir/configure.  The check waits one second, creates
+# conftest.file, lists both files newest first and requires
+# conftest.file to come first; otherwise configure stops with a hint to
+# check the system clock.  A listing that contains anything other than
+# exactly these two names is treated as a broken `ls' and is fatal too.
+# The shell parameters are spelled with m4 quotes inside the macro
+# body so that they reach the generated script as the shell's own
+# positional parameters instead of being taken as macro arguments.
+AC_DEFUN([AM_SANITY_CHECK],
+[AC_MSG_CHECKING([whether build environment is sane])
+# Just in case
+sleep 1
+echo timestamp > conftest.file
+# Do `set' in a subshell so we don't clobber the current shell's
+# arguments.  Must try -L first in case configure is actually a
+# symlink; some systems play weird games with the mod time of symlinks
+# (eg FreeBSD returns the mod time of the symlink's containing
+# directory).
+if (
+   set X `ls -Lt $srcdir/configure conftest.file 2> /dev/null`
+   if test "$[*]" = "X"; then
+      # -L didn't work.
+      set X `ls -t $srcdir/configure conftest.file`
+   fi
+   rm -f conftest.file
+   if test "$[*]" != "X $srcdir/configure conftest.file" \
+      && test "$[*]" != "X conftest.file $srcdir/configure"; then
+
+      # If neither matched, then we have a broken ls.  This can happen
+      # if, for instance, CONFIG_SHELL is bash and it inherits a
+      # broken ls alias from the environment.  This has actually
+      # happened.  Such a system could not be considered "sane".
+      AC_MSG_ERROR([ls -t appears to fail.  Make sure there is not a broken
+alias in your environment])
+   fi
+
+   test "$[2]" = conftest.file
+   )
+then
+   # Ok.
+   :
+else
+   AC_MSG_ERROR([newly created file is older than distributed files!
+Check your system clock])
+fi
+AC_MSG_RESULT(yes)])
+
+# Copyright (C) 2001, 2003, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# AM_PROG_INSTALL_STRIP
+# ---------------------
+# One issue with vendor `install' (even GNU) is that you can't
+# specify the program used to strip binaries.  This is especially
+# annoying in cross-compiling environments, where the build's strip
+# is unlikely to handle the host's binaries.
+# Fortunately install-sh will honor a STRIPPROG variable, so we
+# always use install-sh in `make install-strip', and initialize
+# STRIPPROG with the value of the STRIP variable (set by the user).
+#
+# What the macro itself does: unless $cross_compiling is exactly `no',
+# it looks up STRIP with AC_CHECK_TOOL (falling back to `:'), and it
+# always substitutes INSTALL_STRIP_PROGRAM as `$(install_sh) -c -s'.
+AC_DEFUN([AM_PROG_INSTALL_STRIP],
+[AC_REQUIRE([AM_PROG_INSTALL_SH])dnl
+# Installed binaries are usually stripped using `strip' when the user
+# runs `make install-strip'.  However `strip' might not be the right
+# tool to use in cross-compilation environments, therefore Automake
+# will honor the `STRIP' environment variable to overrule this program.
+dnl Don't test for $cross_compiling = yes, because it might be `maybe'.
+if test "$cross_compiling" != no; then
+  AC_CHECK_TOOL([STRIP], [strip], :)
+fi
+INSTALL_STRIP_PROGRAM="\$(install_sh) -c -s"
+AC_SUBST([INSTALL_STRIP_PROGRAM])])
+
+# Copyright (C) 2006  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# _AM_SUBST_NOTMAKE(VARIABLE)
+# ---------------------------
+# Prevent Automake from outputting VARIABLE = @VARIABLE@ in Makefile.in.
+# This macro is traced by Automake.
+# It is defined without a body, so it expands to nothing; its only
+# effect comes from being seen in the trace.
+AC_DEFUN([_AM_SUBST_NOTMAKE])
+
+# Check how to create a tarball.                            -*- Autoconf -*-
+
+# Copyright (C) 2004, 2005  Free Software Foundation, Inc.
+#
+# This file is free software; the Free Software Foundation
+# gives unlimited permission to copy and/or distribute it,
+# with or without modifications, as long as this notice is preserved.
+
+# serial 2
+
+# _AM_PROG_TAR(FORMAT)
+# --------------------
+# Check how to create a tarball in format FORMAT.
+# FORMAT should be one of `v7', `ustar', or `pax'.
+#
+# Substitute a variable $(am__tar) that is a command
+# writing to stdout a FORMAT-tarball containing the directory
+# $tardir.
+#     tardir=directory && $(am__tar) > result.tar
+#
+# Substitute a variable $(am__untar) that extracts such
+# a tarball read from stdin.
+#     $(am__untar) < result.tar
+#
+# For `v7' the commands are fixed and nothing is probed.  For the other
+# two formats the candidate tools are tried in order (GNU tar, plain
+# tar for ustar only, pax, cpio, and finally `none') until one manages
+# to archive and unpack a scratch directory; the winner is remembered
+# in the cache variable am_cv_prog_tar_FORMAT.  Any other FORMAT is a
+# fatal m4 error.
+# Two spellings of the archiving command are kept while probing:
+# am__tar, with a doubled dollar in front of tardir, is the one that is
+# substituted; am__tar_, with a single dollar, is the one configure
+# runs itself during the probe.
+AC_DEFUN([_AM_PROG_TAR],
+[# Always define AMTAR for backward compatibility.
+AM_MISSING_PROG([AMTAR], [tar])
+m4_if([$1], [v7],
+     [am__tar='${AMTAR} chof - "$$tardir"'; am__untar='${AMTAR} xf -'],
+     [m4_case([$1], [ustar],, [pax],,
+              [m4_fatal([Unknown tar format])])
+AC_MSG_CHECKING([how to create a $1 tar archive])
+# Loop over all known methods to create a tar archive until one works.
+_am_tools='gnutar m4_if([$1], [ustar], [plaintar]) pax cpio none'
+_am_tools=${am_cv_prog_tar_$1-$_am_tools}
+# Do not fold the above two lines into one, because Tru64 sh and
+# Solaris sh will not grok spaces in the rhs of `-'.
+for _am_tool in $_am_tools
+do
+  case $_am_tool in
+  gnutar)
+    for _am_tar in tar gnutar gtar;
+    do
+      AM_RUN_LOG([$_am_tar --version]) && break
+    done
+    am__tar="$_am_tar --format=m4_if([$1], [pax], [posix], [$1]) -chf - "'"$$tardir"'
+    am__tar_="$_am_tar --format=m4_if([$1], [pax], [posix], [$1]) -chf - "'"$tardir"'
+    am__untar="$_am_tar -xf -"
+    ;;
+  plaintar)
+    # Must skip GNU tar: if it does not support --format= it doesn't create
+    # ustar tarball either.
+    (tar --version) >/dev/null 2>&1 && continue
+    am__tar='tar chf - "$$tardir"'
+    am__tar_='tar chf - "$tardir"'
+    am__untar='tar xf -'
+    ;;
+  pax)
+    am__tar='pax -L -x $1 -w "$$tardir"'
+    am__tar_='pax -L -x $1 -w "$tardir"'
+    am__untar='pax -r'
+    ;;
+  cpio)
+    am__tar='find "$$tardir" -print | cpio -o -H $1 -L'
+    am__tar_='find "$tardir" -print | cpio -o -H $1 -L'
+    am__untar='cpio -i -H $1 -d'
+    ;;
+  none)
+    am__tar=false
+    am__tar_=false
+    am__untar=false
+    ;;
+  esac
+
+  # If the value was cached, stop now.  We just wanted to have am__tar
+  # and am__untar set.
+  test -n "${am_cv_prog_tar_$1}" && break
+
+  # tar/untar a dummy directory, and stop if the command works
+  rm -rf conftest.dir
+  mkdir conftest.dir
+  echo GrepMe > conftest.dir/file
+  AM_RUN_LOG([tardir=conftest.dir && eval $am__tar_ >conftest.tar])
+  rm -rf conftest.dir
+  if test -s conftest.tar; then
+    AM_RUN_LOG([$am__untar <conftest.tar])
+    grep GrepMe conftest.dir/file >/dev/null 2>&1 && break
+  fi
+done
+rm -rf conftest.dir
+
+AC_CACHE_VAL([am_cv_prog_tar_$1], [am_cv_prog_tar_$1=$_am_tool])
+AC_MSG_RESULT([$am_cv_prog_tar_$1])])
+AC_SUBST([am__tar])
+AC_SUBST([am__untar])
+]) # _AM_PROG_TAR
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/autogen.sh
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/autogen.sh
@ -0,0 +1,159 @@
+#!/bin/sh
+# Run this to generate all the initial makefiles, etc.
+
+# Directory that holds this script; everything below is looked up
+# relative to it.  "$0" is quoted so that a path containing blanks is
+# handed to dirname in one piece.
+srcdir=`dirname "$0"`
+test -z "$srcdir" && srcdir=.
+
+# Set to 1 by any failed prerequisite check, so that every problem is
+# reported before the script gives up.
+DIE=0
+
+# Optional GNOME 2 prefix: make its aclocal macros, libraries and
+# programs visible to the commands run later in this script.
+if [ -n "$GNOME2_DIR" ]; then
+	ACLOCAL_FLAGS="-I $GNOME2_DIR/share/aclocal $ACLOCAL_FLAGS"
+	LD_LIBRARY_PATH="$GNOME2_DIR/lib:$LD_LIBRARY_PATH"
+	PATH="$GNOME2_DIR/bin:$PATH"
+	export PATH
+	export LD_LIBRARY_PATH
+fi
+
+# Refuse to run unless configure.ac sits next to this script.
+# The message is printed with a single printf: `echo -n' is not
+# portable across /bin/sh implementations (some print the "-n").
+test -f "$srcdir/configure.ac" || {
+    printf '%s\n' "**Error**: Directory \`$srcdir' does not look like the top-level package directory"
+    exit 1
+}
+
+# Prerequisite checks.  Each one starts the tool with --version, with
+# stdin and all output redirected, and only looks at whether the
+# command could be run.  A failure sets DIE instead of exiting, so
+# every missing tool is reported in one go.  Checks for optional tools
+# are made only when configure.ac has a line starting with the macro
+# that needs them.
+
+(autoconf --version) < /dev/null > /dev/null 2>&1 || {
+  echo
+  echo "**Error**: You must have \`autoconf' installed."
+  echo "Download the appropriate package for your distribution,"
+  echo "or get the source tarball at ftp://ftp.gnu.org/pub/gnu/"
+  DIE=1
+}
+
+(grep "^IT_PROG_INTLTOOL" $srcdir/configure.ac >/dev/null) && {
+  (intltoolize --version) < /dev/null > /dev/null 2>&1 || {
+    echo
+    echo "**Error**: You must have \`intltool' installed."
+    echo "You can get it from:"
+    echo "  ftp://ftp.gnome.org/pub/GNOME/"
+    DIE=1
+  }
+}
+
+(grep "^AM_PROG_XML_I18N_TOOLS" $srcdir/configure.ac >/dev/null) && {
+  (xml-i18n-toolize --version) < /dev/null > /dev/null 2>&1 || {
+    echo
+    echo "**Error**: You must have \`xml-i18n-toolize' installed."
+    echo "You can get it from:"
+    echo "  ftp://ftp.gnome.org/pub/GNOME/"
+    DIE=1
+  }
+}
+
+# libtoolize is the program this script actually invokes further down,
+# so that is the one probed here.  A system can provide libtoolize
+# without having a `libtool' executable on PATH, and probing `libtool'
+# would then reject a perfectly usable installation.
+(grep "^AM_PROG_LIBTOOL" $srcdir/configure.ac >/dev/null) && {
+  (libtoolize --version) < /dev/null > /dev/null 2>&1 || {
+    echo
+    echo "**Error**: You must have \`libtool' installed."
+    echo "You can get it from: ftp://ftp.gnu.org/pub/gnu/"
+    DIE=1
+  }
+}
+
+# glib-gettextize is only needed when configure.ac does not contain its
+# own sed-based POTFILES handling.
+(grep "^AM_GLIB_GNU_GETTEXT" $srcdir/configure.ac >/dev/null) && {
+  (grep "sed.*POTFILES" $srcdir/configure.ac) > /dev/null || \
+  (glib-gettextize --version) < /dev/null > /dev/null 2>&1 || {
+    echo
+    echo "**Error**: You must have \`glib' installed."
+    echo "You can get it from: ftp://ftp.gtk.org/pub/gtk"
+    DIE=1
+  }
+}
+
+(automake --version) < /dev/null > /dev/null 2>&1 || {
+  echo
+  echo "**Error**: You must have \`automake' installed."
+  echo "You can get it from: ftp://ftp.gnu.org/pub/gnu/"
+  DIE=1
+  NO_AUTOMAKE=yes
+}
+
+
+# if no automake, don't bother testing for aclocal
+test -n "$NO_AUTOMAKE" || (aclocal --version) < /dev/null > /dev/null 2>&1 || {
+  echo
+  echo "**Error**: Missing \`aclocal'.  The version of \`automake'"
+  echo "installed doesn't appear recent enough."
+  echo "You can get automake from ftp://ftp.gnu.org/pub/gnu/"
+  DIE=1
+}
+
+# Stop here if any prerequisite check failed.
+[ "$DIE" -eq 1 ] && exit 1
+
+# Without command-line arguments, announce that configure gets none.
+if [ -z "$*" ]; then
+  echo "**Warning**: I am going to run \`configure' with no arguments."
+  echo "If you wish to pass any to it, please specify them on the"
+  echo \`$0\'" command line."
+  echo
+fi
+
+# Only the xlc compiler gets an extra automake option.
+if [ "$CC" = xlc ]; then
+  am_opt=--include-deps
+fi
+
+for coin in `find $srcdir -path $srcdir/CVS -prune -o -name configure.ac -print`
+do 
+  dr=`dirname $coin`
+  if test -f $dr/NO-AUTO-GEN; then
+    echo skipping $dr -- flagged as no auto-gen
+  else
+    echo processing $dr
+    ( cd $dr
+
+      aclocalinclude="$ACLOCAL_FLAGS"
+
+      if grep "^AM_GLIB_GNU_GETTEXT" configure.ac >/dev/null; then
+	echo "Creating $dr/aclocal.m4 ..."
+	test -r $dr/aclocal.m4 || touch $dr/aclocal.m4
+	echo "Running glib-gettextize...  Ignore non-fatal messages."
+	echo "no" | glib-gettextize --force --copy
+	echo "Making $dr/aclocal.m4 writable ..."
+	test -r $dr/aclocal.m4 && chmod u+w $dr/aclocal.m4
+      fi
+      if grep "^IT_PROG_INTLTOOL" configure.ac >/dev/null; then
+        echo "Running intltoolize..."
+	intltoolize --copy --force --automake
+      fi
+      if grep "^AM_PROG_XML_I18N_TOOLS" configure.ac >/dev/null; then
+        echo "Running xml-i18n-toolize..."
+	xml-i18n-toolize --copy --force --automake
+      fi
+      if grep "^AM_PROG_LIBTOOL" configure.ac >/dev/null; then
+	if test -z "$NO_LIBTOOLIZE" ; then 
+	  echo "Running libtoolize..."
+	  libtoolize --force --copy
+	fi
+      fi
+      echo "Running aclocal $aclocalinclude ..."
+      aclocal $aclocalinclude
+      if grep "^AM_CONFIG_HEADER" configure.ac >/dev/null; then
+	echo "Running autoheader..."
+	autoheader
+      fi
+      echo "Running automake --gnu $am_opt ..."
+      automake --add-missing --gnu $am_opt
+      echo "Running autoconf ..."
+      autoconf
+    )
+  fi
+done
+
+# configure is always given maintainer mode, ahead of the caller's own
+# arguments.
+conf_flags="--enable-maintainer-mode"
+
+# Setting NOCONFIGURE to any non-empty value skips the configure run.
+# The variable and the configure path are quoted so that a value
+# containing blanks cannot split into several words.
+if test "x$NOCONFIGURE" = x; then
+  echo Running $srcdir/configure $conf_flags "$@" ...
+  "$srcdir/configure" $conf_flags "$@" \
+  && echo Now type \`make\' to compile. || exit 1
+else
+  echo Skipping configure process.
+fi
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.guess
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.guess
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.h
@ -0,0 +1,26 @@
+/* config.h.  Generated from config.h.in by configure.  */
+/* config.h.in.  Generated from configure.ac by autoheader.  */
+
+/* Name of package */
+#define PACKAGE "mgiza"
+
+/* Define to the address where bug reports for this package should be sent. */
+#define PACKAGE_BUGREPORT ""
+
+/* Define to the full name of this package. */
+#define PACKAGE_NAME "mgiza"
+
+/* Define to the full name and version of this package. */
+#define PACKAGE_STRING "mgiza 1.0"
+
+/* Define to the one symbol short name of this package. */
+#define PACKAGE_TARNAME "mgiza"
+
+/* Define to the version of this package. */
+#define PACKAGE_VERSION "1.0"
+
+/* Define to 1 if you have the ANSI C header files. */
+#define STDC_HEADERS 1
+
+/* Version number of package */
+#define VERSION "1.0"
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.h.in
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.h.in
@ -0,0 +1,25 @@
+/* config.h.in.  Generated from configure.ac by autoheader.  */
+
+/* Name of package */
+#undef PACKAGE
+
+/* Define to the address where bug reports for this package should be sent. */
+#undef PACKAGE_BUGREPORT
+
+/* Define to the full name of this package. */
+#undef PACKAGE_NAME
+
+/* Define to the full name and version of this package. */
+#undef PACKAGE_STRING
+
+/* Define to the one symbol short name of this package. */
+#undef PACKAGE_TARNAME
+
+/* Define to the version of this package. */
+#undef PACKAGE_VERSION
+
+/* Define to 1 if you have the ANSI C header files. */
+#undef STDC_HEADERS
+
+/* Version number of package */
+#undef VERSION
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.sub
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/config.sub
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/configure
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/configure
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/configure.ac
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/configure.ac
@ -0,0 +1,28 @@
+dnl Process this file with autoconf to produce a configure script.
+dnl Created by Anjuta application wizard.
+
+dnl Package name and version; they show up as the PACKAGE_NAME and
+dnl PACKAGE_VERSION strings in the generated config.h.
+AC_INIT(mgiza, 1.0)
+
+AM_INIT_AUTOMAKE(AC_PACKAGE_NAME, AC_PACKAGE_VERSION)
+dnl autogen.sh greps for a line beginning with AM_CONFIG_HEADER to
+dnl decide whether autoheader has to run, so this spelling matters.
+AM_CONFIG_HEADER(config.h)
+dnl Provides --enable-maintainer-mode, which autogen.sh passes to configure.
+AM_MAINTAINER_MODE
+
+AC_ISC_POSIX
+AC_PROG_CXX
+AM_PROG_CC_STDC
+AC_HEADER_STDC
+
+
+
+AC_PROG_RANLIB
+dnl autogen.sh greps for a line beginning with AM_PROG_LIBTOOL to
+dnl decide whether libtoolize has to run.
+dnl NOTE(review): AM_PROG_LIBTOOL and AC_PROG_LIBTOOL are both invoked;
+dnl presumably two names for the same macro -- confirm before dropping one.
+AM_PROG_LIBTOOL
+AC_PROG_LIBTOOL
+
+
+
+
+dnl Makefiles that configure generates.
+AC_OUTPUT([
+Makefile
+src/Makefile
+src/mkcls/Makefile
+])
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/install-sh
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/install-sh
@ -0,0 +1,519 @@
+#!/bin/sh
+# install - install a program, script, or datafile
+
+scriptversion=2006-12-25.00
+
+# This originates from X11R5 (mit/util/scripts/install.sh), which was
+# later released in X11R6 (xc/config/util/install.sh) with the
+# following copyright and license.
+#
+# Copyright (C) 1994 X Consortium
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to
+# deal in the Software without restriction, including without limitation the
+# rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
+# sell copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
+# X CONSORTIUM BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN
+# AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNEC-
+# TION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
+#
+# Except as contained in this notice, the name of the X Consortium shall not
+# be used in advertising or otherwise to promote the sale, use or other deal-
+# ings in this Software without prior written authorization from the X Consor-
+# tium.
+#
+#
+# FSF changes to this file are in the public domain.
+#
+# Calling this script install-sh is preferred over install.sh, to prevent
+# `make' implicit rules from creating a file called install from it
+# when there is no Makefile.
+#
+# This script is compatible with the BSD install script, but was written
+# from scratch.
+
+nl='
+'
+IFS=" ""	$nl"
+
+# set DOITPROG to echo to test this script
+
+# Don't use :- since 4.3BSD and earlier shells don't like it.
+doit=${DOITPROG-}
+if test -z "$doit"; then
+  doit_exec=exec
+else
+  doit_exec=$doit
+fi
+
+# Put in absolute file names if you don't have them in your path;
+# or use environment vars.
+
+chgrpprog=${CHGRPPROG-chgrp}
+chmodprog=${CHMODPROG-chmod}
+chownprog=${CHOWNPROG-chown}
+cmpprog=${CMPPROG-cmp}
+cpprog=${CPPROG-cp}
+mkdirprog=${MKDIRPROG-mkdir}
+mvprog=${MVPROG-mv}
+rmprog=${RMPROG-rm}
+stripprog=${STRIPPROG-strip}
+
+posix_glob='?'
+initialize_posix_glob='
+  test "$posix_glob" != "?" || {
+    if (set -f) 2>/dev/null; then
+      posix_glob=
+    else
+      posix_glob=:
+    fi
+  }
+'
+
+posix_mkdir=
+
+# Desired mode of installed file.
+mode=0755
+
+chgrpcmd=
+chmodcmd=$chmodprog
+chowncmd=
+mvcmd=$mvprog
+rmcmd="$rmprog -f"
+stripcmd=
+
+src=
+dst=
+dir_arg=
+dst_arg=
+
+copy_on_change=false
+no_target_directory=
+
+usage="\
+Usage: $0 [OPTION]... [-T] SRCFILE DSTFILE
+   or: $0 [OPTION]... SRCFILES... DIRECTORY
+   or: $0 [OPTION]... -t DIRECTORY SRCFILES...
+   or: $0 [OPTION]... -d DIRECTORIES...
+
+In the 1st form, copy SRCFILE to DSTFILE.
+In the 2nd and 3rd, copy all SRCFILES to DIRECTORY.
+In the 4th, create DIRECTORIES.
+
+Options:
+     --help     display this help and exit.
+     --version  display version info and exit.
+
+  -c            (ignored)
+  -C            install only if different (preserve the last data modification time)
+  -d            create directories instead of installing files.
+  -g GROUP      $chgrpprog installed files to GROUP.
+  -m MODE       $chmodprog installed files to MODE.
+  -o USER       $chownprog installed files to USER.
+  -s            $stripprog installed files.
+  -t DIRECTORY  install into DIRECTORY.
+  -T            report an error if DSTFILE is a directory.
+
+Environment variables override the default commands:
+  CHGRPPROG CHMODPROG CHOWNPROG CMPPROG CPPROG MKDIRPROG MVPROG
+  RMPROG STRIPPROG
+"
+
+# Parse the leading options.  An option that takes a value reads it
+# from $2 and shifts once inside its branch; the shift at the bottom of
+# the loop then removes the option word itself.  Parsing stops at `--'
+# (which is dropped) or at the first word that does not start with `-',
+# which is left in place as the first operand.
+while test $# -ne 0; do
+  case $1 in
+    -c) ;;
+
+    -C) copy_on_change=true;;
+
+    -d) dir_arg=true;;
+
+    -g) chgrpcmd="$chgrpprog $2"
+	shift;;
+
+    --help) echo "$usage"; exit $?;;
+
+    # A mode containing blanks, tabs, newlines or glob characters is
+    # rejected, because $mode is later expanded without quotes.
+    -m) mode=$2
+	case $mode in
+	  *' '* | *'	'* | *'
+'*	  | *'*'* | *'?'* | *'['*)
+	    echo "$0: invalid mode: $mode" >&2
+	    exit 1;;
+	esac
+	shift;;
+
+    -o) chowncmd="$chownprog $2"
+	shift;;
+
+    -s) stripcmd=$stripprog;;
+
+    -t) dst_arg=$2
+	shift;;
+
+    -T) no_target_directory=true;;
+
+    --version) echo "$0 $scriptversion"; exit $?;;
+
+    --)	shift
+	break;;
+
+    -*)	echo "$0: invalid option: $1" >&2
+	exit 1;;
+
+    *)  break;;
+  esac
+  shift
+done
+
+# Split the operands into sources and destination.
+if test $# -ne 0 && test -z "$dir_arg$dst_arg"; then
+  # When -d is used, all remaining arguments are directories to create.
+  # When -t is used, the destination is already specified.
+  # Otherwise, the last argument is the destination.  Remove it from $@.
+  #
+  # The loop walks over the operands as they were on entry.  In every
+  # round the previous candidate is appended to the end of $@ and the
+  # current head is removed, so after the last round $@ holds all
+  # operands except the final one, in their original order, and
+  # dst_arg holds the final one.
+  for arg
+  do
+    if test -n "$dst_arg"; then
+      # $@ is not empty: it contains at least $arg.
+      set fnord "$@" "$dst_arg"
+      shift # fnord
+    fi
+    shift # arg
+    dst_arg=$arg
+  done
+fi
+
+# Nothing left to install: an error for file installs, fine for -d.
+if test $# -eq 0; then
+  if test -z "$dir_arg"; then
+    echo "$0: no input file specified." >&2
+    exit 1
+  fi
+  # It's OK to call `install-sh -d' without argument.
+  # This can happen when creating conditional directories.
+  exit 0
+fi
+
+# For file installs, work out cp_umask, the umask under which the
+# temporary copy is created.
+if test -z "$dir_arg"; then
+  trap '(exit $?); exit' 1 2 13 15
+
+  # Set umask so as not to create temps with too-generous modes.
+  # However, 'strip' requires both read and write access to temps.
+  case $mode in
+    # Optimize common cases.
+    *644) cp_umask=133;;
+    *755) cp_umask=22;;
+
+    # Any other mode ending in an octal digit: the complement of the
+    # last three digits is computed with expr on the decimal reading of
+    # those digits.  When stripping, the result is additionally taken
+    # modulo 200, which removes the owner read and write bits from the
+    # mask.
+    *[0-7])
+      if test -z "$stripcmd"; then
+	u_plus_rw=
+      else
+	u_plus_rw='% 200'
+      fi
+      cp_umask=`expr '(' 777 - $mode % 1000 ')' $u_plus_rw`;;
+    # Anything else is passed on as a symbolic mode, with `,u+rw'
+    # appended when stripping.
+    *)
+      if test -z "$stripcmd"; then
+	u_plus_rw=
+      else
+	u_plus_rw=,u+rw
+      fi
+      cp_umask=$mode$u_plus_rw;;
+  esac
+fi
+
+for src
+do
+  # Work out, for this operand, the final path (dst), the directory it
+  # lives in (dstdir), and whether that directory already exists
+  # (dstdir_status is 0 when it does).
+  # Protect names starting with `-'.
+  case $src in
+    -*) src=./$src;;
+  esac
+
+  if test -n "$dir_arg"; then
+    # With -d the operand itself is the directory to create.
+    dst=$src
+    dstdir=$dst
+    test -d "$dstdir"
+    dstdir_status=$?
+  else
+
+    # Waiting for this to be detected by the "$cpprog $src $dsttmp" command
+    # might cause directories to be created, which would be especially bad
+    # if $src (and thus $dsttmp) contains '*'.
+    if test ! -f "$src" && test ! -d "$src"; then
+      echo "$0: $src does not exist." >&2
+      exit 1
+    fi
+
+    if test -z "$dst_arg"; then
+      echo "$0: no destination specified." >&2
+      exit 1
+    fi
+
+    dst=$dst_arg
+    # Protect names starting with `-'.
+    case $dst in
+      -*) dst=./$dst;;
+    esac
+
+    # If destination is a directory, append the input filename; won't work
+    # if double slashes aren't ignored.
+    if test -d "$dst"; then
+      if test -n "$no_target_directory"; then
+	echo "$0: $dst_arg: Is a directory" >&2
+	exit 1
+      fi
+      dstdir=$dst
+      dst=$dstdir/`basename "$src"`
+      dstdir_status=0
+    else
+      # Prefer dirname, but fall back on a substitute if dirname fails.
+      # The fallbacks are tried in order: dirname, then expr, then sed.
+      dstdir=`
+	(dirname "$dst") 2>/dev/null ||
+	expr X"$dst" : 'X\(.*[^/]\)//*[^/][^/]*/*$' \| \
+	     X"$dst" : 'X\(//\)[^/]' \| \
+	     X"$dst" : 'X\(//\)$' \| \
+	     X"$dst" : 'X\(/\)' \| . 2>/dev/null ||
+	echo X"$dst" |
+	    sed '/^X\(.*[^/]\)\/\/*[^/][^/]*\/*$/{
+		   s//\1/
+		   q
+		 }
+		 /^X\(\/\/\)[^/].*/{
+		   s//\1/
+		   q
+		 }
+		 /^X\(\/\/\)$/{
+		   s//\1/
+		   q
+		 }
+		 /^X\(\/\).*/{
+		   s//\1/
+		   q
+		 }
+		 s/.*/./; q'
+      `
+
+      test -d "$dstdir"
+      dstdir_status=$?
+    fi
+  fi
+
+  obsolete_mkdir_used=false
+
+  if test $dstdir_status != 0; then
+    # One-time probe, run only while posix_mkdir is still empty.  It
+    # computes mkdir_umask and mkdir_mode and then decides whether
+    # `mkdir -p' can be trusted, leaving posix_mkdir set to the command
+    # `:' (trusted) or `false' (not trusted).
+    case $posix_mkdir in
+      '')
+	# Create intermediate dirs using mode 755 as modified by the umask.
+	# This is like FreeBSD 'install' as of 1997-10-28.
+	# Note that `umask' on the next line is an ordinary shell variable
+	# holding the current mask, not a call that changes it.
+	umask=`umask`
+	case $stripcmd.$umask in
+	  # Optimize common cases.
+	  *[2367][2367]) mkdir_umask=$umask;;
+	  .*0[02][02] | .[02][02] | .[02]) mkdir_umask=22;;
+
+	  *[0-7])
+	    mkdir_umask=`expr $umask + 22 \
+	      - $umask % 100 % 40 + $umask % 20 \
+	      - $umask % 10 % 4 + $umask % 2
+	    `;;
+	  *) mkdir_umask=$umask,go-w;;
+	esac
+
+	# With -d, create the new directory with the user-specified mode.
+	# Otherwise, rely on $mkdir_umask.
+	if test -n "$dir_arg"; then
+	  mkdir_mode=-m$mode
+	else
+	  mkdir_mode=
+	fi
+
+	posix_mkdir=false
+	case $umask in
+	  *[123567][0-7][0-7])
+	    # POSIX mkdir -p sets u+wx bits regardless of umask, which
+	    # is incompatible with FreeBSD 'install' when (umask & 300) != 0.
+	    ;;
+	  *)
+	    # Try the real thing on a scratch directory under $TMPDIR
+	    # (or /tmp); the exit trap removes it if the script dies here.
+	    tmpdir=${TMPDIR-/tmp}/ins$RANDOM-$$
+	    trap 'ret=$?; rmdir "$tmpdir/d" "$tmpdir" 2>/dev/null; exit $ret' 0
+
+	    if (umask $mkdir_umask &&
+		exec $mkdirprog $mkdir_mode -p -- "$tmpdir/d") >/dev/null 2>&1
+	    then
+	      if test -z "$dir_arg" || {
+		   # Check for POSIX incompatibilities with -m.
+		   # HP-UX 11.23 and IRIX 6.5 mkdir -m -p sets group- or
+		   # other-writeable bit of parent directory when it shouldn't.
+		   # FreeBSD 6.1 mkdir -m -p sets mode of existing directory.
+		   ls_ld_tmpdir=`ls -ld "$tmpdir"`
+		   case $ls_ld_tmpdir in
+		     d????-?r-*) different_mode=700;;
+		     d????-?--*) different_mode=755;;
+		     *) false;;
+		   esac &&
+		   $mkdirprog -m$different_mode -p -- "$tmpdir" && {
+		     ls_ld_tmpdir_1=`ls -ld "$tmpdir"`
+		     test "$ls_ld_tmpdir" = "$ls_ld_tmpdir_1"
+		   }
+		 }
+	      then posix_mkdir=:
+	      fi
+	      rmdir "$tmpdir/d" "$tmpdir"
+	    else
+	      # Remove any dirs left behind by ancient mkdir implementations.
+	      rmdir ./$mkdir_mode ./-p ./-- 2>/dev/null
+	    fi
+	    trap '' 0;;
+	esac;;
+    esac
+
+    if
+      $posix_mkdir && (
+	umask $mkdir_umask &&
+	$doit_exec $mkdirprog $mkdir_mode -p -- "$dstdir"
+      )
+    then :
+    else
+
+      # The umask is ridiculous, or mkdir does not conform to POSIX,
+      # or it failed possibly due to a race condition.  Create the
+      # directory the slow way, step by step, checking for races as we go.
+
+      case $dstdir in
+	/*) prefix='/';;
+	-*) prefix='./';;
+	*)  prefix='';;
+      esac
+
+      eval "$initialize_posix_glob"
+
+      oIFS=$IFS
+      IFS=/
+      $posix_glob set -f
+      set fnord $dstdir
+      shift
+      $posix_glob set +f
+      IFS=$oIFS
+
+      prefixes=
+
+      # Walk the components of $dstdir from the root downwards.
+      # $prefix is the path built so far.  Components that are missing
+      # are either created on the spot (when mkdir -p is usable) or
+      # collected, shell-quoted, in $prefixes for one mkdir call after
+      # the loop.  Finding an existing directory resets the collection,
+      # since everything gathered before it evidently exists.
+      for d
+      do
+	test -z "$d" && continue
+
+	prefix=$prefix$d
+	if test -d "$prefix"; then
+	  prefixes=
+	else
+	  if $posix_mkdir; then
+	    # Call the umask builtin here.  Writing umask=... would only
+	    # assign a shell variable of that name and leave the process
+	    # mask untouched, so the directories would be created under
+	    # the caller's umask instead of $mkdir_umask.
+	    (umask $mkdir_umask &&
+	     $doit_exec $mkdirprog $mkdir_mode -p -- "$dstdir") && break
+	    # Don't fail if two instances are running concurrently.
+	    test -d "$prefix" || exit 1
+	  else
+	    # Escape single quotes so the name survives the later eval.
+	    case $prefix in
+	      *\'*) qprefix=`echo "$prefix" | sed "s/'/'\\\\\\\\''/g"`;;
+	      *) qprefix=$prefix;;
+	    esac
+	    prefixes="$prefixes '$qprefix'"
+	  fi
+	fi
+	prefix=$prefix/
+      done
+
+      if test -n "$prefixes"; then
+	# Don't fail if two instances are running concurrently.
+	(umask $mkdir_umask &&
+	 eval "\$doit_exec \$mkdirprog $prefixes") ||
+	  test -d "$dstdir" || exit 1
+	obsolete_mkdir_used=true
+      fi
+    fi
+  fi
+
+  # Final stage for this operand.  With -d only ownership, group and
+  # mode of the directory are adjusted.  Otherwise the source is copied
+  # to a temporary name inside the destination directory, given its
+  # attributes there, and then renamed onto the destination.
+  if test -n "$dir_arg"; then
+    # The chmod is skipped only when the directory was not made by the
+    # step-by-step fallback and neither -o nor -g was given.
+    { test -z "$chowncmd" || $doit $chowncmd "$dst"; } &&
+    { test -z "$chgrpcmd" || $doit $chgrpcmd "$dst"; } &&
+    { test "$obsolete_mkdir_used$chowncmd$chgrpcmd" = false ||
+      test -z "$chmodcmd" || $doit $chmodcmd $mode "$dst"; } || exit 1
+  else
+
+    # Make a couple of temp file names in the proper directory.
+    dsttmp=$dstdir/_inst.$$_
+    rmtmp=$dstdir/_rm.$$_
+
+    # Trap to clean up those temp files at exit.
+    trap 'ret=$?; rm -f "$dsttmp" "$rmtmp" && exit $ret' 0
+
+    # Copy the file name to the temp name.
+    (umask $cp_umask && $doit_exec $cpprog "$src" "$dsttmp") &&
+
+    # and set any options; do chmod last to preserve setuid bits.
+    #
+    # If any of these fail, we abort the whole thing.  If we want to
+    # ignore errors from any of these, just make sure not to ignore
+    # errors from the above "$doit $cpprog $src $dsttmp" command.
+    #
+    { test -z "$chowncmd" || $doit $chowncmd "$dsttmp"; } &&
+    { test -z "$chgrpcmd" || $doit $chgrpcmd "$dsttmp"; } &&
+    { test -z "$stripcmd" || $doit $stripcmd "$dsttmp"; } &&
+    { test -z "$chmodcmd" || $doit $chmodcmd $mode "$dsttmp"; } &&
+
+    # If -C, don't bother to copy if it wouldn't change the file.
+    # Fields 2, 4, 5 and 6 of the two `ls -dlL' listings are compared
+    # first, and only if they agree are the contents compared as well.
+    if $copy_on_change &&
+       old=`LC_ALL=C ls -dlL "$dst"	2>/dev/null` &&
+       new=`LC_ALL=C ls -dlL "$dsttmp"	2>/dev/null` &&
+
+       eval "$initialize_posix_glob" &&
+       $posix_glob set -f &&
+       set X $old && old=:$2:$4:$5:$6 &&
+       set X $new && new=:$2:$4:$5:$6 &&
+       $posix_glob set +f &&
+
+       test "$old" = "$new" &&
+       $cmpprog "$dst" "$dsttmp" >/dev/null 2>&1
+    then
+      rm -f "$dsttmp"
+    else
+      # Rename the file to the real destination.
+      $doit $mvcmd -f "$dsttmp" "$dst" 2>/dev/null ||
+
+      # The rename failed, perhaps because mv can't rename something else
+      # to itself, or perhaps because mv is so ancient that it does not
+      # support -f.
+      {
+	# Now remove or move aside any old file at destination location.
+	# We try this two ways since rm can't unlink itself on some
+	# systems and the destination file might be busy for other
+	# reasons.  In this case, the final cleanup might fail but the new
+	# file should still install successfully.
+	{
+	  test ! -f "$dst" ||
+	  $doit $rmcmd -f "$dst" 2>/dev/null ||
+	  { $doit $mvcmd -f "$dst" "$rmtmp" 2>/dev/null &&
+	    { $doit $rmcmd -f "$rmtmp" 2>/dev/null; :; }
+	  } ||
+	  { echo "$0: cannot unlink or rename $dst" >&2
+	    (exit 1); exit 1
+	  }
+	} &&
+
+	# Now rename the file to the real destination.
+	$doit $mvcmd "$dsttmp" "$dst"
+      }
+    fi || exit 1
+
+    # The operand is installed; disarm the cleanup trap.
+    trap '' 0
+  fi
+done
+
+# Local variables:
+# eval: (add-hook 'write-file-hooks 'time-stamp)
+# time-stamp-start: "scriptversion="
+# time-stamp-format: "%:y-%02m-%02d.%02H"
+# time-stamp-end: "$"
+# End:
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/ltmain.sh
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/ltmain.sh
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/mgiza.anjuta
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/mgiza.anjuta
@ -0,0 +1,37 @@
+<?xml version="1.0"?>
+<anjuta>
+    <plugin name="GBF Project Manager"
+            url="http://anjuta.org/plugins/"
+            mandatory="yes">
+		<require group="Anjuta Plugin"
+                 attribute="Interfaces"
+                 value="IAnjutaProjectManager"/>
+		<require group="Project"
+                 attribute="Supported-Project-Types"
+                 value="automake"/>
+	</plugin>
+	<plugin name="Make Build System"
+            url="http://anjuta.org/plugins/"
+            mandatory="yes">
+		<require group="Anjuta Plugin"
+                 attribute="Interfaces"
+                 value="IAnjutaBuildable"/>
+		<require group="Build"
+                 attribute="Supported-Build-Types"
+                 value="make"/>
+	</plugin>
+	<plugin name="Task Manager"
+            url="http://anjuta.org/plugins/"
+            mandatory="no">
+		<require group="Anjuta Plugin"
+                 attribute="Interfaces"
+                 value="IAnjutaTodo"/>
+	</plugin>
+	<plugin name="Debug Manager"
+            url="http://anjuta.org/plugins/"
+            mandatory="no">
+		<require group="Anjuta Plugin"
+                 attribute="Interfaces"
+                 value="IAnjutaDebuggerManager"/>
+	</plugin>
+</anjuta>
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/missing
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/missing
@ -0,0 +1,367 @@
+#! /bin/sh
+# Common stub for a few missing GNU programs while installing.
+
+scriptversion=2006-05-10.23
+
+# Copyright (C) 1996, 1997, 1999, 2000, 2002, 2003, 2004, 2005, 2006
+#   Free Software Foundation, Inc.
+# Originally by Fran,cois Pinard <pinard@iro.umontreal.ca>, 1996.
+
+# This program is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2, or (at your option)
+# any later version.
+
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+
+# You should have received a copy of the GNU General Public License
+# along with this program; if not, write to the Free Software
+# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
+# 02110-1301, USA.
+
+# As a special exception to the GNU General Public License, if you
+# distribute this file as part of a program that contains a
+# configuration script generated by Autoconf, you may include it under
+# the same distribution terms that you use for the rest of that program.
+
+if test $# -eq 0; then
+  echo 1>&2 "Try \`$0 --help' for more information"
+  exit 1
+fi
+
+run=:
+sed_output='s/.* --output[ =]\([^ ]*\).*/\1/p'
+sed_minuso='s/.* -o \([^ ]*\).*/\1/p'
+
+# In the cases where this matters, `missing' is being run in the
+# srcdir already.
+if test -f configure.ac; then
+  configure_ac=configure.ac
+else
+  configure_ac=configure.in
+fi
+
+msg="missing on your system"
+
+case $1 in
+--run)
+  # Try to run requested program, and just exit if it succeeds.
+  run=
+  shift
+  "$@" && exit 0
+  # Exit code 63 means version mismatch.  This often happens
+  # when the user tries to use an ancient version of a tool on
+  # a file that requires a minimum version.  In this case we
+  # should proceed as if the program had been absent, or as
+  # if --run hadn't been passed.
+  if test $? = 63; then
+    run=:
+    msg="probably too old"
+  fi
+  ;;
+
+  -h|--h|--he|--hel|--help)
+    echo "\
+$0 [OPTION]... PROGRAM [ARGUMENT]...
+
+Handle \`PROGRAM [ARGUMENT]...' for when PROGRAM is missing, or return an
+error status if there is no known handling for PROGRAM.
+
+Options:
+  -h, --help      display this help and exit
+  -v, --version   output version information and exit
+  --run           try to run the given command, and emulate it if it fails
+
+Supported PROGRAM values:
+  aclocal      touch file \`aclocal.m4'
+  autoconf     touch file \`configure'
+  autoheader   touch file \`config.h.in'
+  autom4te     touch the output file, or create a stub one
+  automake     touch all \`Makefile.in' files
+  bison        create \`y.tab.[ch]', if possible, from existing .[ch]
+  flex         create \`lex.yy.c', if possible, from existing .c
+  help2man     touch the output file
+  lex          create \`lex.yy.c', if possible, from existing .c
+  makeinfo     touch the output file
+  tar          try tar, gnutar, gtar, then tar without non-portable flags
+  yacc         create \`y.tab.[ch]', if possible, from existing .[ch]
+
+Send bug reports to <bug-automake@gnu.org>."
+    exit $?
+    ;;
+
+  -v|--v|--ve|--ver|--vers|--versi|--versio|--version)
+    echo "missing $scriptversion (GNU Automake)"
+    exit $?
+    ;;
+
+  -*)
+    echo 1>&2 "$0: Unknown \`$1' option"
+    echo 1>&2 "Try \`$0 --help' for more information"
+    exit 1
+    ;;
+
+esac
+
+# Now exit if we have it, but it failed.  Also exit now if we
+# don't have it and --version was passed (most likely to detect
+# the program).
+case $1 in
+  lex|yacc)
+    # Not GNU programs, they don't have --version.
+    ;;
+
+  tar)
+    if test -n "$run"; then
+       echo 1>&2 "ERROR: \`tar' requires --run"
+       exit 1
+    elif test "x$2" = "x--version" || test "x$2" = "x--help"; then
+       exit 1
+    fi
+    ;;
+
+  *)
+    if test -z "$run" && ($1 --version) > /dev/null 2>&1; then
+       # We have it, but it failed.
+       exit 1
+    elif test "x$2" = "x--version" || test "x$2" = "x--help"; then
+       # Could not run --version or --help.  This is probably someone
+       # running `$TOOL --version' or `$TOOL --help' to check whether
+       # $TOOL exists and not knowing $TOOL uses missing.
+       exit 1
+    fi
+    ;;
+esac
+
+# If it does not exist, or fails to run (possibly an outdated version),
+# try to emulate it.
+case $1 in
+  aclocal*)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+         you modified \`acinclude.m4' or \`${configure_ac}'.  You might want
+         to install the \`Automake' and \`Perl' packages.  Grab them from
+         any GNU archive site."
+    touch aclocal.m4
+    ;;
+
+  autoconf)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+         you modified \`${configure_ac}'.  You might want to install the
+         \`Autoconf' and \`GNU m4' packages.  Grab them from any GNU
+         archive site."
+    touch configure
+    ;;
+
+  autoheader)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+         you modified \`acconfig.h' or \`${configure_ac}'.  You might want
+         to install the \`Autoconf' and \`GNU m4' packages.  Grab them
+         from any GNU archive site."
+    files=`sed -n 's/^[ ]*A[CM]_CONFIG_HEADER(\([^)]*\)).*/\1/p' ${configure_ac}`
+    test -z "$files" && files="config.h"
+    touch_files=
+    for f in $files; do
+      case $f in
+      *:*) touch_files="$touch_files "`echo "$f" |
+				       sed -e 's/^[^:]*://' -e 's/:.*//'`;;
+      *) touch_files="$touch_files $f.in";;
+      esac
+    done
+    touch $touch_files
+    ;;
+
+  automake*)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+         you modified \`Makefile.am', \`acinclude.m4' or \`${configure_ac}'.
+         You might want to install the \`Automake' and \`Perl' packages.
+         Grab them from any GNU archive site."
+    find . -type f -name Makefile.am -print |
+	   sed 's/\.am$/.in/' |
+	   while read f; do touch "$f"; done
+    ;;
+
+  autom4te)
+    echo 1>&2 "\
+WARNING: \`$1' is needed, but is $msg.
+         You might have modified some files without having the
+         proper tools for further handling them.
+         You can get \`$1' as part of \`Autoconf' from any GNU
+         archive site."
+
+    # Recover the output file name from `--output FILE' / `--output=FILE',
+    # falling back to `-o FILE'.
+    file=`echo "$*" | sed -n "$sed_output"`
+    test -z "$file" && file=`echo "$*" | sed -n "$sed_minuso"`
+    if test -f "$file"; then
+	# The output already exists: only refresh its timestamp.
+	touch "$file"
+    else
+	# Otherwise emit a stub script into the output file (or to stdout
+	# when no output file was named) and report failure.
+	test -z "$file" || exec >"$file"
+	echo "#! /bin/sh"
+	echo "# Created by GNU Automake missing as a replacement of"
+	echo "#  $ $@"
+	echo "exit 0"
+	# Only chmod when there is a file; chmod without an operand is an error.
+	test -z "$file" || chmod +x "$file"
+	exit 1
+    fi
+    ;;
+
+  bison|yacc)
+    echo 1>&2 "\
+WARNING: \`$1' $msg.  You should only need it if
+         you modified a \`.y' file.  You may need the \`Bison' package
+         in order for those modifications to take effect.  You can get
+         \`Bison' from any GNU archive site."
+    rm -f y.tab.c y.tab.h
+    if test $# -ne 1; then
+        eval LASTARG="\${$#}"
+	case $LASTARG in
+	*.y)
+	    SRCFILE=`echo "$LASTARG" | sed 's/y$/c/'`
+	    if test -f "$SRCFILE"; then
+	         cp "$SRCFILE" y.tab.c
+	    fi
+	    SRCFILE=`echo "$LASTARG" | sed 's/y$/h/'`
+	    if test -f "$SRCFILE"; then
+	         cp "$SRCFILE" y.tab.h
+	    fi
+	  ;;
+	esac
+    fi
+    if test ! -f y.tab.h; then
+	echo >y.tab.h
+    fi
+    if test ! -f y.tab.c; then
+	echo 'main() { return 0; }' >y.tab.c
+    fi
+    ;;
+
+  lex|flex)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+         you modified a \`.l' file.  You may need the \`Flex' package
+         in order for those modifications to take effect.  You can get
+         \`Flex' from any GNU archive site."
+    rm -f lex.yy.c
+    if test $# -ne 1; then
+        eval LASTARG="\${$#}"
+	case $LASTARG in
+	*.l)
+	    SRCFILE=`echo "$LASTARG" | sed 's/l$/c/'`
+	    if test -f "$SRCFILE"; then
+	         cp "$SRCFILE" lex.yy.c
+	    fi
+	  ;;
+	esac
+    fi
+    if test ! -f lex.yy.c; then
+	echo 'main() { return 0; }' >lex.yy.c
+    fi
+    ;;
+
+  help2man)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+	 you modified a dependency of a manual page.  You may need the
+	 \`Help2man' package in order for those modifications to take
+	 effect.  You can get \`Help2man' from any GNU archive site."
+
+    # Recover the output file name from `--output FILE' / `--output=FILE',
+    # falling back to `-o FILE'.
+    file=`echo "$*" | sed -n "$sed_output"`
+    test -z "$file" && file=`echo "$*" | sed -n "$sed_minuso"`
+    if test -f "$file"; then
+	# The page already exists: only refresh its timestamp.
+	touch "$file"
+    else
+	# Otherwise write a placeholder page (to the output file, or to stdout
+	# when none was named) and report failure.
+	test -z "$file" || exec >"$file"
+	echo ".ab help2man is required to generate this page"
+	exit 1
+    fi
+    ;;
+
+  makeinfo)
+    echo 1>&2 "\
+WARNING: \`$1' is $msg.  You should only need it if
+         you modified a \`.texi' or \`.texinfo' file, or any other file
+         indirectly affecting the aspect of the manual.  The spurious
+         call might also be the consequence of using a buggy \`make' (AIX,
+         DU, IRIX).  You might want to install the \`Texinfo' package or
+         the \`GNU make' package.  Grab either from any GNU archive site."
+    # The file to touch is that specified with -o ...
+    file=`echo "$*" | sed -n "$sed_output"`
+    test -z "$file" && file=`echo "$*" | sed -n "$sed_minuso"`
+    if test -z "$file"; then
+      # ... or it is the one specified with @setfilename ...
+      infile=`echo "$*" | sed 's/.* \([^ ]*\) *$/\1/'`
+      file=`sed -n '
+	/^@setfilename/{
+	  s/.* \([^ ]*\) *$/\1/
+	  p
+	  q
+	}' "$infile"`
+      # ... or it is derived from the source name (dir/f.texi becomes f.info)
+      test -z "$file" && file=`echo "$infile" | sed 's,.*/,,;s,.[^.]*$,,'`.info
+    fi
+    # If the file does not exist, the user really needs makeinfo;
+    # let's fail without touching anything.
+    test -f "$file" || exit 1
+    touch "$file"
+    ;;
+
+  tar)
+    shift
+
+    # We have already tried tar in the generic part.
+    # Look for gnutar/gtar before invocation to avoid ugly error
+    # messages.
+    if (gnutar --version > /dev/null 2>&1); then
+       gnutar "$@" && exit 0
+    fi
+    if (gtar --version > /dev/null 2>&1); then
+       gtar "$@" && exit 0
+    fi
+    firstarg="$1"
+    if shift; then
+	case $firstarg in
+	*o*)
+	    firstarg=`echo "$firstarg" | sed s/o//`
+	    tar "$firstarg" "$@" && exit 0
+	    ;;
+	esac
+	case $firstarg in
+	*h*)
+	    firstarg=`echo "$firstarg" | sed s/h//`
+	    tar "$firstarg" "$@" && exit 0
+	    ;;
+	esac
+    fi
+
+    echo 1>&2 "\
+WARNING: I can't seem to be able to run \`tar' with the given arguments.
+         You may want to install GNU tar or Free paxutils, or check the
+         command line arguments."
+    exit 1
+    ;;
+
+  *)
+    echo 1>&2 "\
+WARNING: \`$1' is needed, and is $msg.
+         You might have modified some files without having the
+         proper tools for further handling them.  Check the \`README' file,
+         it often tells you about the needed prerequisites for installing
+         this package.  You may also peek at any GNU archive site, in case
+         some other package would contain this missing \`$1' program."
+    exit 1
+    ;;
+esac
+
+exit 0
+
+# Local variables:
+# eval: (add-hook 'write-file-hooks 'time-stamp)
+# time-stamp-start: "scriptversion="
+# time-stamp-format: "%:y-%02m-%02d.%02H"
+# time-stamp-end: "$"
+# End:
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/TrimBlanks.sh
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/TrimBlanks.sh
@ -0,0 +1,2 @@
+sed -e 's/^[ \t]*//' -e 's/[ \t][ \t]*/ /g' -e 's/[ \t]*$//'
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/force-align-moses.sh
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/force-align-moses.sh
@ -0,0 +1,48 @@
+#!/usr/bin/env bash
+
+# Force-align a corpus using the models of an earlier training run.
+# The script reads corpus/*.vcb, corpus/*.vcb.classes and giza.*/ relative to
+# the current directory and writes everything it produces below ROOT.
+#
+# Arguments: PREFIX SRC TGT ROOT
+#   PREFIX.SRC / PREFIX.TGT are the plain-text corpus files to align.
+
+if [ $# -lt 4 ]; then
+	echo "OK, this is simple, put me into your Moses training directory, link your source/target corpus" 1>&2
+	echo "and run " "$0" " PREFIX src_tag tgt_tag root-dir." 1>&2
+	echo "and get force-aligned data: root-dir/giza.[src-tgt|tgt-src]/*.A3.final.* " 1>&2
+	echo "make sure I can find PREFIX.src_tag and PREFIX.tgt_tag, and \${QMT_HOME} is set" 1>&2
+	# A usage error must not look like success to the caller.
+	exit 1
+fi
+
+# Without QMT_HOME every tool path below would silently resolve to /bin/... .
+if [ -z "${QMT_HOME}" ]; then
+	echo "$0: \${QMT_HOME} is not set" 1>&2
+	exit 1
+fi
+
+MGIZA=${QMT_HOME}/bin/mgiza
+SNT2COOC=${QMT_HOME}/bin/snt2cooc
+
+PRE=$1
+SRC=$2
+TGT=$3
+ROOT=$4
+
+mkdir -p "$ROOT/giza.${SRC}-${TGT}"
+mkdir -p "$ROOT/giza.${TGT}-${SRC}"
+mkdir -p "$ROOT/corpus"
+
+echo "Generating corpus file " 1>&2
+
+# Number the new corpus with the existing vocabularies; extended vocabularies
+# and both .snt files are written below $ROOT/corpus.
+"${QMT_HOME}/scripts/plain2snt-hasvcb.py" "corpus/$SRC.vcb" "corpus/$TGT.vcb" \
+	"${PRE}.${SRC}" "${PRE}.${TGT}" \
+	"$ROOT/corpus/${TGT}-${SRC}.snt" "$ROOT/corpus/${SRC}-${TGT}.snt" \
+	"$ROOT/corpus/$SRC.vcb" "$ROOT/corpus/$TGT.vcb"
+
+ln -sf "$PWD/corpus/$SRC.vcb.classes" "$PWD/corpus/$TGT.vcb.classes" "$ROOT/corpus/"
+
+echo "Generating co-occurrence file " 1>&2
+
+"$SNT2COOC" "$ROOT/giza.${TGT}-${SRC}/$TGT-${SRC}.cooc" "$ROOT/corpus/$SRC.vcb" "$ROOT/corpus/$TGT.vcb" "$ROOT/corpus/${TGT}-${SRC}.snt"
+"$SNT2COOC" "$ROOT/giza.${SRC}-${TGT}/$SRC-${TGT}.cooc" "$ROOT/corpus/$TGT.vcb" "$ROOT/corpus/$SRC.vcb" "$ROOT/corpus/${SRC}-${TGT}.snt"
+
+echo "Running force alignment " 1>&2
+
+# Restart from the previously trained tables (giza.*/ in the current
+# directory); only model 4 gets an iteration (-m4 1), all others are set to 0.
+"$MGIZA" "giza.$TGT-$SRC/$TGT-$SRC.gizacfg" -c "$ROOT/corpus/$TGT-$SRC.snt" -o "$ROOT/giza.${TGT}-${SRC}/$TGT-${SRC}" \
+-s "$ROOT/corpus/$SRC.vcb" -t "$ROOT/corpus/$TGT.vcb" -m1 0 -m2 0 -mh 0 -coocurrence "$ROOT/giza.${TGT}-${SRC}/$TGT-${SRC}.cooc" \
+-restart 11 -previoust "giza.$TGT-$SRC/$TGT-$SRC.t3.final" \
+-previousa "giza.$TGT-$SRC/$TGT-$SRC.a3.final" -previousd "giza.$TGT-$SRC/$TGT-$SRC.d3.final" \
+-previousn "giza.$TGT-$SRC/$TGT-$SRC.n3.final" -previousd4 "giza.$TGT-$SRC/$TGT-$SRC.d4.final" \
+-previousd42 "giza.$TGT-$SRC/$TGT-$SRC.D4.final" -m3 0 -m4 1
+
+"$MGIZA" "giza.$SRC-$TGT/$SRC-$TGT.gizacfg" -c "$ROOT/corpus/$SRC-$TGT.snt" -o "$ROOT/giza.${SRC}-${TGT}/$SRC-${TGT}" \
+-s "$ROOT/corpus/$TGT.vcb" -t "$ROOT/corpus/$SRC.vcb" -m1 0 -m2 0 -mh 0 -coocurrence "$ROOT/giza.${SRC}-${TGT}/$SRC-${TGT}.cooc" \
+-restart 11 -previoust "giza.$SRC-$TGT/$SRC-$TGT.t3.final" \
+-previousa "giza.$SRC-$TGT/$SRC-$TGT.a3.final" -previousd "giza.$SRC-$TGT/$SRC-$TGT.d3.final" \
+-previousn "giza.$SRC-$TGT/$SRC-$TGT.n3.final" -previousd4 "giza.$SRC-$TGT/$SRC-$TGT.d4.final" \
+-previousd42 "giza.$SRC-$TGT/$SRC-$TGT.D4.final" -m3 0 -m4 1
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/giza2bal.pl
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/giza2bal.pl
@ -0,0 +1,112 @@
+#! /usr/bin/perl
+
+# $Id: giza2bal.pl 1562 2008-02-19 20:48:14Z redpony $
+#Converts direct and inverted alignments into a more compact 
+#bi-alignment format. It optionally reads the counting file 
+#produced by giza containing the frequency of each training sentence.
+
+#Copyright Marcello Federico, November 2004
+
+# Command-line state: optional count file, direct and inverted alignment files.
+($cnt,$dir,$inv)=();
+
+# Consume the options -d, -i and -c; each one takes the argument that follows
+# it.  Any other argument is ignored.
+while ($w=shift @ARGV){
+  $dir=shift(@ARGV),next  if $w eq "-d";
+  $inv=shift(@ARGV),next  if $w eq "-i";
+  $cnt=shift(@ARGV),next  if $w eq "-c";
+}
+
+# Number of sentence pairs read so far; ReadBiAlign increments it and uses it
+# in its mismatch message.
+my $lc = 0;
+
+# Both alignment files are mandatory.
+if (!$dir || !$inv){
+ print  "usage: giza2bal.pl [-c <count-file>] -d <dir-align-file> -i <inv-align-file>\n"; 
+ print  "input files can be also commands, e.g. -d \"gunzip -c file.gz\"\n";
+ exit(0);
+}
+
+$|=1;
+
+# Every input is first tried as a plain file and then as a command to read from.
+open(DIR,"<$dir") || open(DIR,"$dir|") || die "cannot open $dir\n";
+open(INV,"<$inv") || open(INV,"$inv|") || die "cannot open $inv\n";
+
+if ($cnt){
+open(CNT,"<$cnt") || open(CNT,"$cnt|") || die "cannot open $cnt\n";
+}
+
+
+# Read the next sentence pair from the count, direct and inverted inputs.
+#
+# Arguments: three file handles (count, direct, inverted) followed by five
+# typeglobs.  The globs are assigned to the local globs *s1,*s2,*a,*b,*c, so
+# $s1, $s2, @a, @b and $c below refer to the variables the caller passed in.
+#
+# On return @a and @b hold the word links of the direct / inverted alignment,
+# $s1 and $s2 the second line of each record and $c the count.
+# Both exit paths return 1.
+# NOTE: $t1, $t2, $m, $M and $N are not declared here and are therefore
+# package globals.
+sub ReadBiAlign{
+    local($fd0,$fd1,$fd2,*s1,*s2,*a,*b,*c)=@_;
+    local($dummy,$n);
+
+    chop($c=<$fd0>); ## count
+    $dummy=<$fd0>; ## header
+    $dummy=<$fd0>; ## header
+    # an empty or zero count (e.g. nothing could be read from $fd0) becomes 1
+    $c=1 if !$c;
+
+    # direct record: header line, sentence line, aligned line
+    $dummy=<$fd1>; ## header
+    chop($s1=<$fd1>);
+    chop($t1=<$fd1>);
+
+    # inverted record: same three-line layout
+    $dummy=<$fd2>; ## header
+    chop($s2=<$fd2>);
+    chop($t2=<$fd2>);
+
+    @a=@b=();
+    $lc++;
+
+    #get target statistics
+    $n=1;
+    # drop the NULL entry, then consume one "word ({ positions })" group per
+    # iteration: every listed position is mapped to the group's index $n
+    $t1=~s/NULL \(\{((\s+\d+)*)\s+\}\)//;
+    while ($t1=~s/(\S+)\s+\(\{((\s+\d+)*)\s+\}\)//){
+        grep($a[$_]=$n,split(/\s+/,$2));
+        $n++;
+    }
+
+    # same procedure for the inverted alignment, filling @b
+    $m=1;
+    $t2=~s/NULL \(\{((\s+\d+)*)\s+\}\)//;
+    while ($t2=~s/(\S+)\s+\(\{((\s+\d+)*)\s+\}\)//){
+        grep($b[$_]=$m,split(/\s+/,$2));
+        $m++;
+    }
+
+    # split in scalar context: number of whitespace-separated tokens
+    $M=split(/\s+/,$s1);
+    $N=split(/\s+/,$s2);
+
+    # The number of groups in each aligned line must equal the number of
+    # tokens in the other record's sentence line; otherwise replace the pair
+    # by a one-word placeholder.
+    if ($m != ($M+1) || $n != ($N+1)) {
+      print STDERR "Sentence mismatch error! Line #$lc\n";
+      $s1 = "ALIGN_ERR";
+      $s2 = "ALIGN_ERR";
+      @a=(); @b=();
+      for ($j=1;$j<2;$j++){ $a[$j]=1; }
+      for ($i=1;$i<2;$i++){ $b[$i]=1; }
+      return 1;
+    }
+
+    # positions that received no link are set to 0
+    for ($j=1;$j<$m;$j++){
+        $a[$j]=0 if !$a[$j];
+    }
+
+    for ($i=1;$i<$n;$i++){
+        $b[$i]=0 if !$b[$i];
+    }
+
+
+    return 1;
+}
+
+# Convert sentence pairs until the direct alignment input is exhausted.
+# Each accepted pair is printed as three lines: the count, then the two
+# sentences, each preceded by its length and followed by its link vector.
+$skip=0;
+$ccc=0;
+until (eof(DIR)){
+
+    unless (ReadBiAlign(CNT,DIR,INV,*src,*tgt,*a,*b,*c))
+    {
+        # rejected pair: emit an empty line, one progress dot per 1000 skips
+    	print "\n";
+        print STDERR "." unless ++$skip % 1000;
+        next;
+    }
+
+    $ccc++;
+    print "$c\n";
+    print $#a," $src \# @a[1..$#a]\n";
+    print $#b," $tgt \# @b[1..$#b]\n";
+}
+print STDERR "skip=<$skip> counts=<$ccc>\n";
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/merge_alignment.py
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/merge_alignment.py
@ -0,0 +1,80 @@
+#!/usr/bin/env python
+# Author : Qin Gao
+# Date   : Dec 31, 2007
+# Purpose: Combine multiple alignment files into a single one, the files are
+#          prodcuced by MGIZA, which has sentence IDs, and every file is 
+#          ordered inside
+
+import sys
+import re
+
+if len(sys.argv)<2:
+	sys.stderr.write("Provide me the file names (at least 2)\n");
+	sys.exit();
+
+sent_id = 0;
+
+files = [];
+ids = [];
+
+sents = [];
+done = [];
+
+for i in range(1,len(sys.argv)):
+	files.append(open(sys.argv[i],"r"));
+	ids.append(0);
+	sents.append("");
+	done.append(False);
+
+r = re.compile("\\((\\d+)\\)");	
+i = 0;
+while i< len(files):
+	st1 = files[i].readline();
+	st2 = files[i].readline();
+	st3 = files[i].readline();
+	if len(st1)==0 or len(st2)==0 or len(st3)==0:
+		done[i] = True;
+	else:
+		mt = r.search(st1);
+		id = int(mt.group(1));
+		ids[i] = id;
+		sents[i] = (st1, st2, st3);
+	i += 1
+		
+cont = True;
+while (cont):
+	sent_id += 1;
+	writeOne = False;
+# Now try to read more sentences
+	i = 0;
+	cont = False;
+	while i < len(files):
+		if done[i]:
+			i+=1
+			continue;
+		cont = True;
+		if ids[i] == sent_id:
+			sys.stdout.write("%s%s%s"%(sents[i][0],sents[i][1],sents[i][2]));
+			writeOne = True;
+			st1 = files[i].readline();
+			st2 = files[i].readline();
+			st3 = files[i].readline();
+			if len(st1)==0 or len(st2)==0 or len(st3)==0:
+				done[i] = True;
+			else:
+				mt = r.search(st1);
+				id = int(mt.group(1));
+				ids[i] = id;
+				sents[i] = (st1, st2, st3);
+				cont = True;
+			break;
+		elif ids[i] < sent_id:
+			sys.stderr.write("ERROR! DUPLICATED ENTRY %d\n" % ids[i]);
+			sys.exit();
+		else:
+			cont = True;
+		i+=1;
+	if (not writeOne) and cont:
+		sys.stderr.write("ERROR! MISSING ENTRy %d\n" % sent_id);
+		#sys.exit();
+sys.stderr.write("Combined %d files, totally %d sents \n" %(len(files),sent_id-1));
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/plain2snt-hasvcb.py
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/plain2snt-hasvcb.py
@ -0,0 +1,93 @@
+#!/usr/bin/env python
+
+from sys import *
+
+def loadvcb(fname,out):
+	dict={};
+	df = open(fname,"r");
+	for line in df:
+		out.write(line);
+		ws = line.strip().split();
+	        id = int(ws[0]);
+		wd = ws[1];
+		dict[wd]=id;
+	return dict;
+
+if len(argv)<9:
+	stderr.write("Error, the input should be \n");
+	stderr.write("%s evcb fvcb etxt ftxt esnt(out) fsnt(out) evcbx(out) fvcbx(out)\n" % argv[0]);
+	stderr.write("You should concatenate the evcbx and fvcbx to existing vcb files\n");
+	exit();
+
+ein = open(argv[3],"r");
+fin = open(argv[4],"r");
+
+eout = open(argv[5],"w");
+fout = open(argv[6],"w");
+
+evcbx = open(argv[7],"w");
+fvcbx = open(argv[8],"w");
+evcb = loadvcb(argv[1],evcbx);
+fvcb = loadvcb(argv[2],fvcbx);
+
+i=0
+while True:
+	i+=1;
+	eline=ein.readline();
+	fline=fin.readline();
+	if len(eline)==0 or len(fline)==0:
+		break;
+	ewords = eline.strip().split();
+	fwords = fline.strip().split();
+	el = [];
+	fl = [];
+	j=0;
+	for w in ewords:
+		j+=1
+		if evcb.has_key(w):
+			el.append(evcb[w]);
+		else:
+			if evcb.has_key(w.lower()):
+				el.append(evcb[w.lower()]);
+			else:
+				##stdout.write("#E %d %d %s\n" % (i,j,w))
+				#el.append(1);
+				nid = len(evcb)+1;
+				evcb[w.lower()] = nid;
+				evcbx.write("%d %s 1\n" % (nid, w));
+				el.append(nid);
+
+	j=0;
+	for w in fwords:
+		j+=1
+		if fvcb.has_key(w):
+			fl.append(fvcb[w]);
+		else:
+			if fvcb.has_key(w.lower()):
+				fl.append(fvcb[w.lower()]);
+			else:
+				#stdout.write("#F %d %d %s\n" % (i,j,w))
+				nid = len(fvcb)+1;
+				fvcb[w.lower()] = nid;
+				fvcbx.write("%d %s 1\n" % (nid, w));
+				fl.append(nid);
+				#fl.append(1);
+	eout.write("1\n");
+	fout.write("1\n");
+	for I in el:
+		eout.write("%d " % I);
+	eout.write("\n");
+	for I in fl:
+		eout.write("%d " % I);
+		fout.write("%d " % I);
+	eout.write("\n");
+	fout.write("\n");
+	for I in el:
+		fout.write("%d " % I);
+	fout.write("\n");
+
+fout.close();
+eout.close();
+fvcbx.close();
+evcbx.close();
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/sntpostproc.py
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/sntpostproc.py
@ -0,0 +1,116 @@
+#!/usr/bin/env python
+
+# This script post process the snt file -- either in single-line format or in multi-line format
+# The output, however, will always be in single-line format
+
+from sys import *
+from optparse import OptionParser
+import re;
+usage = """
+The script post process the snt file, the input could be single-line snt 
+file or multi-line, (triple line) and can insert sentence weight to the
+file (-w) or add partial alignment to the file (-a)
+Usage %prog -s sntfile -w weight-file -a alignfile -o outputfile
+"""
+parser = OptionParser(usage=usage)
+
+
+parser = OptionParser()
+
+parser.add_option("-s", "--snt", dest="snt",default=None,
+		help="The input snt file", metavar="FILE")
+
+parser.add_option("-w", "--weight", dest="weight",default=None,
+		help="The input weight file", metavar="FILE")
+
+
+parser.add_option("-o", "--output", dest="output",default="-",
+		help="The input partial alignment file, one sentence per line", metavar="FILE")
+
+parser.add_option("-a", "--align", dest="align",default=None,
+		help="The input partial alignment file, one sentence per line", metavar="FILE")
+
+
+(options, args) = parser.parse_args()
+
+if options.snt == None:
+	parser.print_help();
+	exit();
+else:
+	sfile = open(options.snt,"r");
+
+if options.output=="-":
+	ofile = stdout;
+else:
+	ofile = open(options.output,"w");
+
+wfile = None;
+
+if options.weight <> None:
+	wfile = open(options.weight,"r");
+
+afile = None;
+if options.align <> None:
+	afile = open(options.align,"r");
+
+rr = re.compile("[\\|\\#\\*]");
+wt = 0.0;
+al = {};
+e = "";
+f = "";
+
+def parse_ax(line):
+	alq = {};
+	als = line.strip().split(" ");
+	for e in als:
+		if len(e.strip())>0:
+			alo = e.split("-");
+			if len(alo)==2:
+				alq[tuple(alo)] = 1;
+	return alq;
+	
+
+
+
+
+
+while True:
+	l = sfile.readline();
+	if len(l) == 0:
+		break;
+	lp = rr.split(l.strip());
+	if len(lp)>=3:
+		wt = float(lp[0]);
+		e = lp[1];
+		f = lp[2];
+		if len(lp) > 3:
+			al = parse_ax(lp[3]);
+		else:
+			al = {};
+	else:
+		wt = float(l);
+		e = sfile.readline().strip();
+		f = sfile.readline().strip();
+		al={}
+	if wfile <> None:
+		lw = wfile.readline().strip();
+		if len(lw)>0:
+			wt = float(lw);
+		else:
+			wt = 1;
+	if afile <> None:
+		la = afile.readline().strip();
+		if len(la)>0:
+			al1 = parse_ax(la);
+			for entry in al1.keys():
+				al[entry] = 1;
+
+	ofile.write("%g | %s | %s" % (wt, e, f));
+	if len(al)>0:
+		ofile.write(" |");
+
+		for entry in al.keys():
+			ofile.write(" %s-%s" % entry);
+	ofile.write("\n");
+
+	
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/symal.sh
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/scripts/symal.sh
@ -0,0 +1,15 @@
+#!/usr/bin/env bash
+
+OUTPUT=$1
+shift
+GIZA2BAL=$1
+shift
+SYMAL=$1
+shift
+STOT=$1
+shift
+TTOS=$1
+shift
+
+perl $GIZA2BAL -d ${STOT} -i ${TTOS} | $SYMAL $* > $OUTPUT 
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/.cvsignore
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/.cvsignore
@ -0,0 +1,17 @@
+.libs
+.deps
+.*swp
+.nautilus-metafile.xml
+*.autosave
+*.bak
+*~
+#*#
+*.gladep
+*.la
+*.lo
+*.o
+*.class
+*.pyc
+*.plugin
+Makefile
+Makefile.in
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ATables.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ATables.cpp
@ -0,0 +1,212 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#include "ATables.h" 
+#include "Globals.h"
+#include "myassert.h"
+#include "Parameter.h"
+
+// Tunable globals used by amodel.  The quoted strings are the parameter name
+// and its description; the last argument looks like the default value
+// (NOTE(review): confirm against the GLOBAL_PARAMETER macro definition).
+// CompactADTable selects the compact table layout in the loops below.
+GLOBAL_PARAMETER(bool,CompactADTable,"compactadtable","1: only 3-dimensional alignment table for IBM-2 and IBM-3",PARLEV_MODELS,1);
+GLOBAL_PARAMETER(float,amodel_smooth_factor,"model23SmoothFactor","smoothing parameter for IBM-2/3 (interpolation with constant)",PARLEV_SMOOTH,0.0);
+
+template <class VALTYPE>
+void amodel<VALTYPE>::printTable(const char *filename) const{
+  // Print the amodel to the file named filename (it is created or
+  // overwritten).  Only entries whose value exceeds PROB_SMOOTH are written.
+  // format : for a table : 
+  //              aj j l m  val 
+  // where aj is source word pos, j target word pos, l source sentence length, 
+  //       m is target sentence length.
+  // If the file cannot be opened an error is printed and nothing is written.
+    if (is_distortion)
+        cout << "Dumping pruned distortion table (d) to file:" << filename <<'\n';
+    else 
+        cout << "Dumping pruned alignment table (a) to file:" << filename <<'\n';
+    
+    ofstream of(filename);
+    if( !of ){
+        cerr << "\nERROR: Cannot open " << filename << " for writing\n";
+        return;
+    }
+    for(WordIndex l=0; l < MaxSentLength; l++){
+        for(WordIndex m=0;m<MaxSentLength;m++){
+            // in compact mode only the diagonal l==m is visited
+            if( CompactADTable && l!=m )
+                continue;
+            // in compact mode one of the two lengths is pinned to MaxSentLength-1
+            unsigned int L=((CompactADTable&&is_distortion)?MaxSentLength:(l+1))-1;
+            unsigned int M=((CompactADTable&&!is_distortion)?MaxSentLength:(m+1))-1;
+            if( is_distortion==0 ){
+                for(WordIndex j=1;j<=M; j++){
+                    for(WordIndex i=0;i<=L; i++){
+                        VALTYPE x=getValue(i, j, L, M); 
+                        if( x>PROB_SMOOTH ){
+                            of << i << ' ' << j << ' ' << L << ' ' << M << ' ' << x << '\n';
+                        }
+                    }
+                }
+            }else{
+                // distortion table: the two position indices are swapped
+                for(WordIndex i=0;i<=L;i++){
+                    for(WordIndex j=1;j<=M;j++){
+                        VALTYPE x=getValue(j, i, L, M);
+                        if( x>PROB_SMOOTH ){
+                            of << j << ' ' << i << ' ' << L << ' ' << M << ' ' << x << '\n';
+                        }
+                    }
+                }
+            }
+        }
+    }
+}
+
+template <class VALTYPE>
+void amodel<VALTYPE>::printRealTable(const char *filename) const{
+  // Print the amodel to the file named filename (it is created or
+  // overwritten).  Only entries whose value exceeds MINCOUNTINCREASE are
+  // written.
+  // format : for a table : 
+  //              aj j l m  val 
+  // where aj is source word pos, j target word pos, l source sentence length, 
+  //       m is target sentence length.
+  // If the file cannot be opened an error is printed and nothing is written.
+    if (is_distortion)
+        cout << "Dumping not pruned distortion table (d) to file:" << filename <<'\n';
+    else 
+        cout << "Dumping not pruned alignment table (a) to file:" << filename <<'\n';
+    
+    ofstream of(filename);
+    if( !of ){
+        cerr << "\nERROR: Cannot open " << filename << " for writing\n";
+        return;
+    }
+    for(WordIndex l=0; l < MaxSentLength; l++){
+        for(WordIndex m=0;m<MaxSentLength;m++){
+            // in compact mode only the diagonal l==m is visited
+            if(  CompactADTable && l!=m )
+                continue;
+            // in compact mode one of the two lengths is pinned to MaxSentLength-1
+            unsigned int L=((CompactADTable&&is_distortion)?MaxSentLength:(l+1))-1;
+            unsigned int M=((CompactADTable&&!is_distortion)?MaxSentLength:(m+1))-1;
+            if( is_distortion==0 ){
+                for(WordIndex j=1;j<=M; j++){
+                    for(WordIndex i=0;i<=L; i++){
+                        VALTYPE x=getValue(i, j, L, M); 
+                        if( x>MINCOUNTINCREASE ){
+                            of << i << ' ' << j << ' ' << L << ' ' << M << ' ' << x << '\n';
+                        }
+                    }
+                }
+            }else{
+                // distortion table: the two position indices are swapped
+                for(WordIndex i=0;i<=L;i++){
+                    for(WordIndex j=1;j<=M;j++){
+                        VALTYPE x=getValue(j, i, L, M);
+                        if( x>MINCOUNTINCREASE ){
+                            of << j << ' ' << i << ' ' << L << ' ' << M << ' ' << x << '\n';
+                        }
+                    }
+                }
+            }
+        }
+    }
+}
+
+extern short NoEmptyWord;
+
+template <class VALTYPE>
+bool amodel<VALTYPE>::readTable(const char *filename){
+  /* Load table entries from a text file.
+     Every record consists of five whitespace-separated fields
+         w x l m val
+     and is stored with setValue(w, x, l, m, val); the four indices are used
+     in the order in which they appear in the file, so the same reader serves
+     both a and d tables.
+     Reading stops at end of file or at the first record that fails to parse.
+     Returns false, after printing an error, when the file cannot be opened
+     and true otherwise.
+  */
+    ifstream input(filename);
+    cout << "Reading a/d table from " << filename << "\n";
+    if( input.fail() ){
+        cerr << "\nERROR: Cannot open " << filename<<"\n";
+        return false;
+    }
+    WordIndex first, second, l, m;
+    VALTYPE value;
+    for(;;){
+        input >> first >> second >> l >> m >> value;
+        if( input.fail() )
+            break;
+        setValue(first, second, l, m, value);
+    }
+    return true;
+}
+
+template <class VALTYPE>
+bool amodel<VALTYPE>::readAugTable(const char *filename){
+  /* Read table entries from a text file and add them to this table.
+     Every record consists of five whitespace-separated fields
+         w x l m val
+     and is passed to addValue(w, x, l, m, val); the four indices are used in
+     the order in which they appear in the file.
+     Reading stops at end of file or at the first record that fails to parse.
+     Returns false, after printing an error, when the file cannot be opened
+     and true otherwise.
+  */
+    ifstream input(filename);
+    cout << "Reading a/d table from " << filename << "\n";
+    if( input.fail() ){
+        cerr << "\nERROR: Cannot open " << filename<<"\n";
+        return false;
+    }
+    WordIndex first, second, l, m;
+    VALTYPE value;
+    for(;;){
+        input >> first >> second >> l >> m >> value;
+        if( input.fail() )
+            break;
+        addValue(first, second, l, m, value);
+    }
+    return true;
+}
+
+// Adds every entry of `am` to the corresponding entry of this table.
+// The table is walked with the same index ranges as the print functions;
+// which of the two loop orders is used depends on this object's
+// is_distortion flag.  Always returns true.
+template <class VALTYPE>
+bool amodel<VALTYPE>::merge(amodel<VALTYPE>& am){
+    cout << "start merging " <<"\n";
+    for(WordIndex l=0; l < MaxSentLength; l++){
+        for(WordIndex m=0;m<MaxSentLength;m++){
+            // in compact mode only the diagonal l==m is visited
+            if( !CompactADTable || l==m ){
+                // in compact mode one of the two lengths is pinned to MaxSentLength-1
+                const unsigned int L=((CompactADTable&&is_distortion)?MaxSentLength:(l+1))-1;
+                const unsigned int M=((CompactADTable&&!is_distortion)?MaxSentLength:(m+1))-1;
+                if( is_distortion==0 ){
+                    for(WordIndex col=1;col<=M; col++){
+                        for(WordIndex row=0;row<=L; row++){
+                            const VALTYPE delta=am.getValue(row, col, L, M);
+                            addValue(row,col,L,M,delta);
+                        }
+                    }
+                }else{
+                    // distortion table: the two position indices are swapped
+                    for(WordIndex row=0;row<=L;row++){
+                        for(WordIndex col=1;col<=M;col++){
+                            const VALTYPE delta=am.getValue(col, row, L, M);
+                            addValue(col,row,L,M,delta);
+                        }
+                    }
+                }
+            }
+        }
+    }
+    return true;
+}
+
+
+template class amodel<COUNT> ; 
+//template class amodel<PROB> ; 
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ATables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ATables.h
@ -0,0 +1,191 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* --------------------------------------------------------------------------*
+ *                                                                           *
+ * Module :ATables                                                           *
+ *                                                                           *
+ * Prototypes File: ATables.h                                                *
+ *                                                                           *
+ * Objective: Defines classes and methods for handling I/O for distortion &  *
+ *            alignment tables.                                              *
+ *****************************************************************************/
+
+#ifndef _atables_h
+#define _atables_h 1
+
+#include "defs.h"
+#include <cassert>
+#include <iostream>
+#include <algorithm>
+#include <functional>
+#include <map>
+#include <set>
+#include "Vector.h"
+#include <utility>
+#if __GNUC__>2
+#include <ext/hash_map>
+using __gnu_cxx::hash_map;
+#else
+#include <hash_map>
+#endif
+#include <fstream>
+#include "Array4.h"
+#include "myassert.h"
+#include "Globals.h"
+#include "syncObj.h"
+
+extern bool CompactADTable;
+extern float amodel_smooth_factor;
+extern short NoEmptyWord;
+
+/* ------------------- Class Definitions of amodel --------------------------*/
+/* Class Name: amodel:
+   Objective: This defines the underlying data structure for distortion prob.
+   and count tables. They are defined as a hash table. Each entry in the hash
+   table is the probability (d(j/l,m,i), where j is word target position, i is
+   source word position connected to it, m is target sentence length, and l is
+   source sentence length) or count collected for it. The  probability and the
+   count are represented as log integer probability as 
+   defined by the class LogProb .  
+
+  This class is used to represent a tables (alignment probability) and d
+  (distortion) tables and also their corresponding count tables .
+  
+  *--------------------------------------------------------------------------*/
+
+// Absolute value of an int: negative arguments are negated, all others are
+// returned unchanged.
+inline int Mabs(int a){
+    return (a<0) ? -a : a;
+}
+
+// Four-index table of VALTYPE values stored in an Array4. The same class
+// serves as an a (alignment) table or, when is_distortion is set, as a
+// d (distortion) table in which the two position indices are swapped.
+// Writes through setValue()/addValue() are serialised by `lock`.
+template <class VALTYPE>
+class amodel{
+public:
+    Array4<VALTYPE> a;          // underlying storage
+    bool is_distortion ; 
+    WordIndex MaxSentLength;    // exclusive upper bound for l and m (see the asserts below)
+    // NOTE(review): ignoreL/ignoreM are not initialised by the constructor and
+    // are not referenced anywhere inside this class body.
+    bool ignoreL, ignoreM;
+    // Raw (unsmoothed) read of one cell.
+    // Asserted ranges: d table: 1 <= aj <= m and j <= l;
+    //                  a table: aj <= l and 1 <= j <= m;
+    //                  both:    l, m < MaxSentLength.
+    // The storage indices are (l+1, m+1), except that in compact mode
+    // (CompactADTable) the l index of a d table, or the m index of an a table,
+    // is replaced by MaxSentLength.
+    VALTYPE get(WordIndex aj, WordIndex j, WordIndex l, WordIndex m)const{
+        massert( (!is_distortion) || aj<=m );massert( (!is_distortion) || j<=l );massert( (!is_distortion) || aj!=0 );
+        massert( is_distortion    || aj<=l );massert( is_distortion    || j<=m );massert( (is_distortion) || j!=0 );
+        massert( l<MaxSentLength );massert( m<MaxSentLength );
+        return a.get(aj, j, (CompactADTable&&is_distortion)?MaxSentLength:(l+1),(CompactADTable&&!is_distortion)?MaxSentLength:(m+1));
+    }
+    
+    // NOTE(review): declared here, but the methods of this class read the
+    // global amodel_smooth_factor instead.
+    static float smooth_factor;
+    // flag == true selects d-table behaviour. Storage is sized for
+    // MAX_SENTENCE_LENGTH+1 and unset cells read as 0.0.
+    amodel(bool flag = false)
+        : a(MAX_SENTENCE_LENGTH+1,0.0), is_distortion(flag), MaxSentLength(MAX_SENTENCE_LENGTH)
+    {}; 
+    
+protected:
+    // Writable access to one cell, using the same index mapping as get().
+    // Unlike get(), it does not assert aj != 0 for a d table.
+    VALTYPE&getRef(WordIndex aj, WordIndex j, WordIndex l, WordIndex m){
+        massert( (!is_distortion) || aj<=m );massert( (!is_distortion) || j<=l );
+        massert( is_distortion    || aj<=l );massert( is_distortion    || j<=m );massert( (is_distortion) || j!=0 );
+        massert( l<MaxSentLength );massert( m<MaxSentLength );
+        return a(aj, j, (CompactADTable&&is_distortion)?MaxSentLength:(l+1),(CompactADTable&&!is_distortion)?MaxSentLength:(m+1));
+    }
+public:
+    // Overwrites one cell while holding `lock`.
+    void setValue(WordIndex aj, WordIndex j, WordIndex l, WordIndex m, VALTYPE val) {
+    	lock.lock();
+        getRef(aj, j, l, m)=val;
+        lock.unlock();
+    }
+    
+    Mutex lock;
+public:
+    /**
+    By Qin
+    Adds val to one cell while holding `lock`.
+    */
+    void addValue(WordIndex aj, WordIndex j, WordIndex l, WordIndex m, VALTYPE val) {
+    	lock.lock();
+        getRef(aj, j, l, m)+=val;
+        lock.unlock();
+    }
+    // Accumulates the (smoothed) values of `am` into this table.
+    bool merge(amodel<VALTYPE>& am);
+    // Smoothed read: the stored value is interpolated with a uniform term,
+    // amodel_smooth_factor/(l+1) for an a table and amodel_smooth_factor/m for
+    // a d table, and the result is never below PROB_SMOOTH.
+    // NOTE(review): the d-table branch divides by m; callers presumably never
+    // pass m == 0 there - confirm.
+    VALTYPE getValue(WordIndex aj, WordIndex j, WordIndex l, WordIndex m) const{
+        if( is_distortion==0 )
+            return max(double(PROB_SMOOTH),amodel_smooth_factor/(l+1)+(1.0-amodel_smooth_factor)*get(aj, j, l, m));
+        else
+            return max(double(PROB_SMOOTH),amodel_smooth_factor/m+(1.0-amodel_smooth_factor)*get(aj, j, l, m));	
+    }
+    
+    void printTable(const char* filename)const ; 
+    void printRealTable(const char* filename)const ; 
+    // Writes a normalised version of this table into aTable.
+    //  - Only length pairs with l == m are visited when CompactADTable is set.
+    //  - a table: for each j the cells are divided by their sum over i.
+    //  - d table: for each i the cells are divided by their sum over j and
+    //    interpolated with amodel_smooth_factor/M.
+    //  - With NoEmptyWord set, cells with i == 0 are forced to 0.
+    //  - Groups whose sum is zero are not written to aTable at all.
+    // Prints the number of cells written. Note that the template parameter is
+    // itself named COUNT.
+    template<class COUNT>
+        void normalize(amodel<COUNT>& aTable)const
+    {
+        WordIndex i, j, l, m ;
+        COUNT total;
+        int nParam=0;
+        for(l=0;l<MaxSentLength;l++){
+            for(m=0;m<MaxSentLength;m++){
+                if( CompactADTable && l!=m )
+                    continue;
+                // Largest valid position per dimension (see get() for the mapping).
+                unsigned int L=((CompactADTable&&is_distortion)?MaxSentLength:(l+1))-1;
+                unsigned int M=((CompactADTable&&!is_distortion)?MaxSentLength:(m+1))-1;
+                if( is_distortion==0 ){
+                    for(j=1;j<=M; j++){
+                        total=0.0;
+                        for(i=0;i<=L;i++){
+                            total+=get(i, j, L, M);
+                        }
+                        if( total ){
+                            for(i=0;i<=L;i++){
+                                nParam++;
+                                aTable.getRef(i, j, L, M)=get(i, j, L, M)/total;
+                                massert(aTable.getRef(i,j,L,M)<=1.0);
+                                if( NoEmptyWord&&i==0 )
+                                    aTable.getRef(i,j,L,M)=0;
+                            }
+                        }
+                    }
+                }else{
+                    for(i=0;i<=L;i++){
+                        total=0.0;
+                        for(j=1;j<=M;j++)
+                            total+=get(j, i, L, M);
+                        if( total )
+                            for(j=1;j<=M;j++){
+                                aTable.getRef(j, i, L, M)=amodel_smooth_factor/M+(1.0-amodel_smooth_factor)*get(j, i, L, M)/total;
+                                nParam++;
+                                massert(aTable.getRef(j,i,L,M)<=1.0);
+                                if( NoEmptyWord&&i==0 )
+                                    aTable.getRef(j,i,L,M)=0;
+                            }
+                    }
+                }
+            }
+        }
+        cout << "A/D table contains " << nParam << " parameters.\n";
+    }
+    
+    bool readTable(const char *filename); 
+    bool readAugTable(const char *filename); 
+    // Resets the underlying storage via Array4::clear().
+    void clear()
+    {a.clear();}
+};
+
+/* ------------------- End of amodel Class Definitions ----------------------*/
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/AlignTables.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/AlignTables.cpp
@ -0,0 +1,44 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#include "AlignTables.h"
+
+// Adds alignment `aj` with value `val` to the table.
+// Returns true only when a new entry was stored. Returns false, leaving the
+// table unchanged, when `val <= 0` or when `aj` is already present.
+bool alignmodel::insert(Vector<WordIndex>& aj, LogProb val)
+{
+  if(val <= 0)
+    return false ;
+  // hash_map::insert refuses duplicate keys and reports in `.second` whether
+  // the element was added, so no separate find() is needed.
+  return a.insert(pair<const Vector<WordIndex>, LogProb>(aj, val)).second ;
+}
+ 
+
+// Returns the value stored for `align`, or a LogProb built from 0.0 when the
+// alignment is not in the table.
+LogProb alignmodel::getValue(Vector<WordIndex>& align) const
+{
+  typedef hash_map<Vector<WordIndex>, LogProb, hashmyalignment, equal_to_myalignment > AlignHash;
+  AlignHash::const_iterator hit = a.find(align);
+  if(hit != a.end())
+    return hit->second;
+  const LogProb zero = 0.0 ;
+  return zero;
+}
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/AlignTables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/AlignTables.h
@ -0,0 +1,124 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef _aligntables_h
+#define _aligntables_h 1
+
+#include "defs.h"
+ 
+
+#include <cassert>
+ 
+#include <iostream>
+#include <algorithm>
+#include <functional>
+#include <map>
+#include <set>
+//#include <vector>
+#include "Vector.h"
+#include <utility>
+#if __GNUC__>2
+#include <ext/hash_map>
+using __gnu_cxx::hash_map;
+#else
+#include <hash_map>
+#endif
+#include <cmath>
+#include <fstream>
+#include "transpair_model1.h"
+
+
+/* ----------------- Class Definitions for hashmyalignment -------------------
+   Objective: This class is used to define a hash mapping function to map
+   an alignment (defined as a vector of integers) into a hash key
+ ----------------------------------------------------------------------------*/
+
+class hashmyalignment : public unary_function< Vector<WordIndex>, size_t >
+{
+public:
+  // Hash of an alignment vector: the sum over positions 1..size()-1 of
+  // key[pos] raised to the power (pos % 6)+1, reduced modulo 1000000.
+  // Position 0 does not contribute to the hash.
+  // NOTE(review): each power is converted double -> int -> size_t; a power
+  // larger than INT_MAX makes that conversion undefined behaviour.
+  size_t operator() (const Vector<WordIndex>& key) const
+    {
+      size_t total = 0 ;
+      for (WordIndex pos = 1 ; pos < key.size() ; ++pos){
+	const double exponent = double((pos % 6)+1) ;
+	total += (size_t) (int) pow(double(key[pos]), exponent);
+      }
+      return total % 1000000 ;
+    }
+};
+
+class equal_to_myalignment{
+  // Returns true if two alignments are the same: equal size and equal entries
+  // at positions 1..size()-1. Position 0 is not compared, matching
+  // hashmyalignment, which does not hash it either.
+public:
+  // The vectors are taken by const reference; taking them by value copied
+  // both alignments on every key comparison.
+  bool operator()(const Vector<WordIndex>& t1, 
+		  const Vector<WordIndex>& t2) const
+    {
+    if (t1.size() != t2.size())
+      return(false);
+    for (WordIndex j = 1 ; j < t1.size() ; j++)
+      if (t1[j] != t2[j])
+	return(false);
+    return(true);
+    }
+    
+};
+
+/* ---------------- End of Class Definition for hashmyalignment -------------*/
+
+
+/* ------------------ Class Definitions for alignmodel ----------------------
+ Class Name: alignmodel
+ Objective: Alignment neighborhoods (collections of alignments) are stored in
+ a hash table (for easy lookup). Each alignment vector is mapped into a hash 
+ key using the operator defined above.
+ *--------------------------------------------------------------------------*/
+
+// Table mapping an alignment vector to a LogProb, backed by a hash_map that
+// hashes keys with hashmyalignment and compares them with equal_to_myalignment.
+class alignmodel{
+private:
+  hash_map<Vector<WordIndex>, LogProb, hashmyalignment, equal_to_myalignment > a;
+  //  void erase(Vector<WordIndex>&);
+public:
+
+  // Iteration over the stored alignments.
+  hash_map<Vector<WordIndex>, LogProb, hashmyalignment, equal_to_myalignment >::iterator begin()
+    {
+      return a.begin();
+    }
+  hash_map<Vector<WordIndex>, LogProb, hashmyalignment, equal_to_myalignment >::iterator end()
+    {
+      return a.end();
+    }
+
+  // Read-only access to the underlying hash table.
+  const hash_map<Vector<WordIndex>, LogProb, hashmyalignment, equal_to_myalignment >& getHash() const
+    {
+      return a;
+    }
+
+  // Adds an alignment (defined in AlignTables.cpp).
+  bool insert(Vector<WordIndex>&, LogProb val=0.0);
+  //  void setValue(Vector<WordIndex>&, LogProb val); // not needed
+
+  // Retrieves the value stored for an alignment (defined in AlignTables.cpp).
+  LogProb getValue(Vector<WordIndex>&)const;
+
+  // Removes every stored alignment.
+  void clear()
+    {
+      a.clear();
+    }
+  //  void printTable(const char* filename);
+
+  // Forwards to hash_map::resize.
+  void resize(WordIndex n)
+    {
+      a.resize(n);
+    }
+
+};
+
+/* -------------- End of alignmodel Class Definitions -----------------------*/
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Array.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Array.h
@ -0,0 +1,5 @@
+#ifndef GIZA_ARRAY_H_DEFINED
+#define GIZA_ARRAY_H_DEFINED
+#include "Vector.h"
+// Array is a purely textual alias: after this header every use of the token
+// `Array` is replaced by `Vector` by the preprocessor.
+#define Array Vector
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Array2.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Array2.h
@ -0,0 +1,126 @@
+/*
+
+ EGYPT Toolkit for Statistical Machine Translation
+ Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful, 
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+ USA.
+
+ */
+/*--
+ Array2: Implementation of a two-dimensional checked array allowing for
+ a specified underlying one-dimensional data structure.
+
+ Franz Josef Och (30/07/99)
+ --*/
+#ifndef CLASS_Array2_DEFINED
+#define CLASS_Array2_DEFINED
+
+#include "mystl.h"
+#include <string>
+#include <vector>
+
+// Two-dimensional array of T with h1 rows and h2 columns, stored row-major in
+// a one-dimensional container Y (element (i,j) lives at p[i*h2+j]).
+// Every element access asserts that both indices are in range.
+template<class T, class Y=vector<T> > class Array2 {
+public:
+	Y p;
+	//  short h1, h2;
+	unsigned int h1, h2;
+public:
+	// h1 x h2 array; the elements are whatever Y(size) produces.
+	Array2(unsigned int _h1, unsigned int _h2) :
+		p(_h1*_h2), h1(_h1), h2(_h2) {
+	}
+	// h1 x h2 array with every element set to _init.
+	Array2(unsigned int _h1, unsigned int _h2, const T&_init) :
+		p(_h1*_h2, _init), h1(_h1), h2(_h2) {
+	}
+	// Empty 0 x 0 array.
+	Array2() :
+		h1(0), h2(0) {
+	}
+	// Checked element access (writable).
+	inline T &operator()(unsigned int i, unsigned int j) {
+		assert(i<h1);
+		assert(j<h2);
+		return p[i*h2+j];
+	}
+	// Checked element access (read-only).
+	inline const T&operator()(unsigned int i, unsigned int j) const {
+		assert(i<h1);
+		assert(j<h2);
+		return p[i*h2+j];
+	}
+	// Checked read returning a copy of the element.
+	inline T get(unsigned int i, unsigned int j) {
+		assert(i<h1);
+		assert(j<h2);
+		return p[i*h2+j];
+	}
+	// Checked write of element (i,j).
+	inline void set(unsigned int i, unsigned int j, T x) {
+		assert(i<h1);
+		assert(j<h2);
+		p[i*h2+j]=x;
+	}
+	// Checked read returning a copy of the element (const object).
+	inline const T get(unsigned int i, unsigned int j) const {
+		assert(i<h1);
+		assert(j<h2);
+		return p[i*h2+j];
+	}
+	// Number of rows.
+	inline unsigned int getLen1() const {
+		return h1;
+	}
+	// Number of columns.
+	inline unsigned int getLen2() const {
+		return h2;
+	}
+
+	// Pointer to the first element, or 0 for an array with no elements.
+	inline T*begin() {
+		if (h1==0||h2==0)
+			return 0;
+		return &(p[0]);
+	}
+	// Pointer one past the last element, or 0 for an array with no elements.
+	inline T*end() {
+		if (h1==0||h2==0)
+			return 0;
+		return &(p[0])+p.size();
+	}
+
+	// Const counterparts of begin()/end(). They take the address of the first
+	// element exactly like the non-const overloads, because a container
+	// iterator (what p.begin() returns) is not in general convertible to
+	// const T*.
+	inline const T*begin() const {
+		if (h1==0||h2==0)
+			return 0;
+		return &(p[0]);
+	}
+	inline const T*end() const {
+		if (h1==0||h2==0)
+			return 0;
+		return &(p[0])+p.size();
+	}
+
+	// Prints one line per row, elements separated by a blank, followed by an
+	// empty line.
+	friend ostream&operator<<(ostream&out, const Array2<T, Y>&ar) {
+		for (unsigned int i=0; i<ar.getLen1(); i++) {
+			//out << i << ": ";
+			for (unsigned int j=0; j<ar.getLen2(); j++)
+				out << ar(i, j) << ' ';
+			out << '\n';
+		}
+		return out << endl;
+	}
+	// Changes the dimensions; does nothing when they are already a x b.
+	// The flat storage is resized only, so existing elements keep their flat
+	// position rather than their (i,j) position.
+	inline void resize(unsigned int a, unsigned int b) {
+		if ( !(a==h1&&b==h2)) {
+			h1=a;
+			h2=b;
+			p.resize(h1*h2);
+		}
+	}
+	// Changes the dimensions and sets EVERY element to t; does nothing (no
+	// fill either) when the dimensions are already a x b.
+	inline void resize(unsigned int a, unsigned int b, const T&t) {
+		if ( !(a==h1&&b==h2)) {
+			h1=a;
+			h2=b;
+			p.resize(h1*h2);
+			fill(p.begin(), p.end(), t);
+		}
+	}
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Array4.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Array4.h
@ -0,0 +1,78 @@
+/*
+
+Copyright (C) 2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef AlignmentArray4_h_DEFINED
+#define AlignmentArray4_h_DEFINED
+
+#include "Array2.h"
+// Sparse four-index array: an M x M grid of lazily allocated square Array2<T>
+// sub-tables selected by (l,m), each addressed by (i,j).
+// Reading a cell of a sub-table that was never written returns `init`.
+// NOTE(review): the class owns raw pointers but declares no copy constructor
+// or assignment operator; copying an Array4 would lead to a double delete.
+template<class T> class Array4
+{
+ private:
+  Array2< Array2<T>* > A;   // sub-table pointers, 0 while unallocated
+  int M;                    // grid dimension
+  T init;                   // value of never-written cells
+ public:
+  // m x m grid with no sub-table allocated yet.
+  Array4(int m,const T&_init)
+    : A(m,m,0),M(m),init(_init) {}
+  // Frees every allocated sub-table.
+  ~Array4()
+    {
+      for(int l=0;l<M;++l)
+	for(int m=0;m<M;++m)
+	  delete A(l,m);
+    }
+  // Read-only access; never allocates.
+  const T&operator()(int i, int j, int l, int m)const
+    {
+      if( A(l,m)==0 )
+	return init;
+      else
+	return (*A(l,m))(i,j);
+    }
+  // Same as the const operator().
+  const T&get(int i, int j, int l, int m)const
+    {
+      if( A(l,m)==0 )
+	return init;
+      else
+	return (*A(l,m))(i,j);
+    }
+  // Writable access; allocates the (l,m) sub-table on first use as a square
+  // of side max(l+1,m+1) filled with `init`, so both i and j may range up to
+  // max(l,m).
+  T&operator()(int i, int j, int l, int m)
+    {
+      if( A(l,m)==0 )
+	{
+	  A(l,m)=new Array2<T>(max(l+1,m+1),max(l+1,m+1),init);
+	}
+      return (*A(l,m))(i,j);
+    }
+  // Sets every cell of every allocated sub-table to 0.0.
+  // The whole allocated square is cleared: cells with i > l or j > m are
+  // writable through operator() and must not keep stale values.
+  void clear()
+    {
+      for(int l=0;l<M;++l)
+	for(int m=0;m<M;++m)
+	  if( A(l,m) )
+	    {
+	      Array2<T>&a=*A(l,m);
+	      for(unsigned int i=0;i<a.getLen1();++i)
+		for(unsigned int j=0;j<a.getLen2();++j)
+		  a(i,j)=0.0;
+	    }
+    }
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/D4Tables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/D4Tables.h
@ -0,0 +1,772 @@
+/*
+
+ Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+ This file is part of GIZA++ ( extension of GIZA ).
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful, 
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+ USA.
+
+ */
+#ifndef _d4tables_h_define
+#define _d4tables_h_define
+#include <cmath>
+#include <sstream>
+#include "WordClasses.h"
+#include "Globals.h"
+#include "myassert.h"
+#include "syncObj.h"
+extern float d4modelsmooth_factor;
+
+// Key of the distortion tables D1 / Db1 in d4model. `deps` is a bit mask
+// tested against the DEP_MODEL_* / DEP_MODELb_* flags; the comparators
+// compare1 / compareb1 decide which of the remaining fields take part in the
+// ordering.
+class m4_key {
+public:
+	int deps;
+	int l;
+	int m;
+	int F;
+	int E;
+	int prevj;
+	int vacancies1, vacancies2;
+	m4_key(int _deps, int _l, int _m, int _F, int _E, int _prevj, int _v1,
+			int _v2) :
+		deps(_deps), l(_l), m(_m), F(_F), E(_E), prevj(_prevj),
+				vacancies1(_v1), vacancies2(_v2) {
+	}
+
+	// Labelled dump of the fields selected by the DEP_MODEL_* bits of deps,
+	// plus each vacancy count that is not -1, ended by a newline.
+	// prevj is not printed.
+	friend ostream&print1(ostream&out, const m4_key&key, const WordClasses&wce,
+			const WordClasses&wcf) {
+		if (key.deps&DEP_MODEL_l) {
+			out << "l: " << key.l << ' ';
+		}
+		if (key.deps&DEP_MODEL_m) {
+			out << "m: " << key.m << ' ';
+		}
+		if (key.deps&DEP_MODEL_F) {
+			out << "F: " << wcf.classString(key.F) << ' ';
+		}
+		if (key.deps&DEP_MODEL_E) {
+			out << "E: " << wce.classString(key.E) << ' ';
+		}
+		if (key.vacancies1!=-1) {
+			out << "v1: " << key.vacancies1 << ' ';
+		}
+		if (key.vacancies2!=-1) {
+			out << "v2: " << key.vacancies2 << ' ';
+		}
+		out << '\n';
+		return out;
+	}
+
+	// Unlabelled dump: E class, F class ("0" when the corresponding
+	// DEP_MODEL_* bit is off), then both vacancy counts, each followed by a
+	// blank. No newline is written.
+	friend ostream&print1_m5(ostream&out, const m4_key&key,
+			const WordClasses&wce, const WordClasses&wcf) {
+		const bool hasE = (key.deps&DEP_MODEL_E) != 0;
+		const bool hasF = (key.deps&DEP_MODEL_F) != 0;
+		out << (hasE ? wce.classString(key.E) : string("0")) << ' ';
+		out << (hasF ? wcf.classString(key.F) : string("0")) << ' ';
+		out << key.vacancies1 << ' ' << key.vacancies2 << ' ';
+		return out;
+	}
+
+	// Like print1, but the fields are selected by the DEP_MODELb_* bits.
+	friend ostream&printb1(ostream&out, const m4_key&key, const WordClasses&wce,
+			const WordClasses&wcf) {
+		if (key.deps&DEP_MODELb_l) {
+			out << "l: " << key.l << ' ';
+		}
+		if (key.deps&DEP_MODELb_m) {
+			out << "m: " << key.m << ' ';
+		}
+		if (key.deps&DEP_MODELb_F) {
+			out << "F: " << wcf.classString(key.F) << ' ';
+		}
+		if (key.deps&DEP_MODELb_E) {
+			out << "E: " << wce.classString(key.E) << ' ';
+		}
+		if (key.vacancies1!=-1) {
+			out << "v1: " << key.vacancies1 << ' ';
+		}
+		if (key.vacancies2!=-1) {
+			out << "v2: " << key.vacancies2 << ' ';
+		}
+		out << '\n';
+		return out;
+	}
+
+	// Unlabelled dump starting with the literal "-1 ", then the F class
+	// ("0" when the bit is off) and both vacancy counts.
+	// NOTE(review): this tests DEP_MODEL_F, not DEP_MODELb_F as printb1 does -
+	// confirm that this is intended.
+	friend ostream&printb1_m5(ostream&out, const m4_key&key,
+			const WordClasses&wcf) {
+		const bool hasF = (key.deps&DEP_MODEL_F) != 0;
+		out << "-1 " << (hasF ? wcf.classString(key.F) : string("0")) << ' ';
+		out << key.vacancies1 << ' ' << key.vacancies2 << ' ';
+		return out;
+	}
+};
+
+// Strict weak ordering on m4_key: lexicographic over l, m, F, E (each only
+// when its DEP_MODEL_* bit is set in deps), then always vacancies1 and
+// vacancies2. prevj never takes part in the comparison.
+class compare1 {
+private:
+	int deps;
+public:
+	compare1(int _deps) :
+		deps(_deps) {
+	}
+	bool operator()(const m4_key&a, const m4_key&b) const {
+		if ((deps&DEP_MODEL_l) && a.l!=b.l)
+			return a.l<b.l;
+		if ((deps&DEP_MODEL_m) && a.m!=b.m)
+			return a.m<b.m;
+		if ((deps&DEP_MODEL_F) && a.F!=b.F)
+			return a.F<b.F;
+		if ((deps&DEP_MODEL_E) && a.E!=b.E)
+			return a.E<b.E;
+		if (a.vacancies1!=b.vacancies1)
+			return a.vacancies1<b.vacancies1;
+		return a.vacancies2<b.vacancies2;
+	}
+};
+
+// Strict weak ordering on m4_key: lexicographic over l, m, F, E (each only
+// when its DEP_MODELb_* bit is set in deps), then always vacancies1 and
+// vacancies2. prevj never takes part in the comparison.
+class compareb1 {
+private:
+	int deps;
+public:
+	compareb1(int _deps) :
+		deps(_deps) {
+	}
+	bool operator()(const m4_key&a, const m4_key&b) const {
+		if ((deps&DEP_MODELb_l) && a.l!=b.l)
+			return a.l<b.l;
+		if ((deps&DEP_MODELb_m) && a.m!=b.m)
+			return a.m<b.m;
+		if ((deps&DEP_MODELb_F) && a.F!=b.F)
+			return a.F<b.F;
+		if ((deps&DEP_MODELb_E) && a.E!=b.E)
+			return a.E<b.E;
+		if (a.vacancies1!=b.vacancies1)
+			return a.vacancies1<b.vacancies1;
+		return a.vacancies2<b.vacancies2;
+	}
+};
+
+// Splits `in` at whitespace and appends every token to `out`; `out` is not
+// cleared first. Uses istringstream instead of the deprecated istrstream.
+inline void tokenize(const string&in, Vector<string>&out) {
+	istringstream words(in);
+	string word;
+	while (words>>word)
+		out.push_back(word);
+}
+
+class d4model {
+public:
+	typedef Vector<pair<COUNT,PROB> > Vpff;
+	map<m4_key,Vpff,compare1 > D1;
+	map<m4_key,Vpff,compareb1> Db1;
+	PositionIndex msl;
+	WordClasses* ewordclasses;
+	WordClasses* fwordclasses;
+	// Loads the e and f word classes from efile / ffile into *ewordclasses and
+	// *fwordclasses. A file that cannot be opened is reported on cerr and
+	// skipped; the other file is still processed.
+	template<class MAPPER> void makeWordClasses(const MAPPER&m1,
+			const MAPPER&m2, string efile, string ffile, const vcbList& elist,
+	    const vcbList& flist) {
+		ifstream estrm(efile.c_str()), fstrm(ffile.c_str());
+		if (estrm) {
+			ewordclasses->read(estrm, m1,elist);
+		} else {
+			cerr << "ERROR: can not read " << efile << endl;
+		}
+		if (fstrm) {
+			fwordclasses->read(fstrm, m2,flist);
+		} else {
+			cerr << "ERROR: can not read " << ffile << endl;
+		}
+	}
+	// Both tables order their keys according to M4_Dependencies. The word
+	// class objects are stored by address and are not owned by the model.
+	d4model(PositionIndex _msl, WordClasses& e, WordClasses& f)
+		: D1(compare1(M4_Dependencies)),
+		  Db1(compareb1(M4_Dependencies)),
+		  msl(_msl),
+		  ewordclasses(&e),
+		  fwordclasses(&f)
+	{
+	}
+	
+protected:
+	// Reference to the count stored in D1 for displacement j-j_cp under the
+	// key (l, m, F, E). A missing row is created with msl*2+1 zeroed
+	// (count, prob) pairs; the displacement is shifted by msl to index the row.
+	inline COUNT&getCountRef_first(WordIndex j, WordIndex j_cp, int E, int F, int l,
+			int m) {
+		assert(j>=1);
+		m4_key key(M4_Dependencies, l, m, F, E, j_cp, -1, -1);
+		map<m4_key,Vpff,compare1 >::iterator row=D1.find(key);
+		if (row==D1.end()) {
+			row=D1.insert(make_pair(key,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+		}
+		assert(row!=D1.end());
+		Vpff& cells=row->second;
+		return cells[j-j_cp+msl].first;
+	};
+
+	// Reference to the count stored in Db1 for displacement j-j_prev under the
+	// key (l, m, F, E). A missing row is created with msl*2+1 zeroed
+	// (count, prob) pairs; the displacement is shifted by msl to index the row.
+	inline COUNT&getCountRef_bigger(WordIndex j, WordIndex j_prev, int E, int F,
+			int l, int m) {
+		assert(j>=1);
+		assert(j_prev>=1);
+		m4_key key(M4_Dependencies, l, m, F, E, j_prev, -1, -1);
+		map<m4_key,Vpff,compareb1 >::iterator row=Db1.find(key);
+		if (row==Db1.end()) {
+			row=Db1.insert(make_pair(key,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+		}
+		assert(row!=Db1.end());
+		Vpff& cells=row->second;
+		return cells[j-j_prev+msl].first;
+	};
+	Mutex lock_f,lock_b;
+public:
+	// Adds v to the D1 count selected by the arguments while holding lock_f.
+	inline void augCountRef_first(WordIndex j, WordIndex j_cp, int E, int F, int l,
+			int m, const COUNT& v){
+		lock_f.lock();
+		COUNT& cell=getCountRef_first(j,j_cp,E,F,l,m);
+		cell+=v;
+		lock_f.unlock();
+	}
+	
+	// Adds v to the Db1 count selected by the arguments while holding lock_b.
+	inline void augCountRef_bigger(WordIndex j, WordIndex j_prev, int E, int F,
+				int l, int m, const COUNT& v){
+		lock_b.lock();
+		COUNT& cell=getCountRef_bigger(j,j_prev,E,F,l,m);
+		cell+=v;
+		lock_b.unlock();
+	}
+	
+	
+
+	// Adds the tables of `d` into this model: for every row of d.D1 / d.Db1
+	// the `.second` component of each cell is added to the matching cell
+	// here; rows missing in this model are created zero-filled first.
+	// NOTE(review): only `.second` is merged, `.first` is left untouched -
+	// confirm that this is the intended component.
+	// NOTE(review): assumes the rows of `d` are not longer than msl*2+1.
+	void merge(d4model &d) {
+		for (map<m4_key,Vpff,compare1 >::iterator it = d.D1.begin(); it!=d.D1.end(); ++it) {
+			map<m4_key,Vpff,compare1 >::iterator p=D1.find(it->first);
+			if (p==D1.end())
+				p=D1.insert(make_pair(it->first,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+			int i;
+			for (i=0; i<it->second.size(); i++) {
+				p->second[i].second+=it->second[i].second;
+			}
+		}
+		// Db1 is ordered by compareb1, so it needs iterators of its own map
+		// type; reusing the compare1 iterator type is not portable.
+		for (map<m4_key,Vpff,compareb1 >::iterator itb = d.Db1.begin(); itb!=d.Db1.end(); ++itb) {
+			map<m4_key,Vpff,compareb1 >::iterator p=Db1.find(itb->first);
+			if (p==Db1.end())
+				p=Db1.insert(make_pair(itb->first,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+			int i;
+			for (i=0; i<itb->second.size(); i++) {
+				p->second[i].second+=itb->second[i].second;
+			}
+		}
+	}
+
+	// Reads count records from fD1 (into D1) and fDb (into Db1) and ADDS each
+	// value to the `.first` component of the matching cell.
+	// Record layout, whitespace separated:
+	//   deps l m F E prevj vacancies1 vacancies2 len  followed by len values.
+	// The `deps` value read from the file is ignored; keys are always built
+	// with M4_Dependencies.
+	// Returns false if a file cannot be opened or a record announces more
+	// values than a row can hold; counts read before that point stay applied.
+	bool augCount(const char* fD1, const char* fDb) {
+		ifstream ifsd(fD1);
+		int deps;
+		int l;
+		int m;
+		int F;
+		int E;
+		int prevj;
+		int vacancies1, vacancies2;
+		int len;
+		double count;
+		if (!ifsd) {
+			cerr << "Failed in " << fD1 << endl;
+			return false;
+		}
+		{
+			while (ifsd >> deps >> l >> m >>F >> E >> prevj >> vacancies1
+					>>vacancies2>>len) {
+				m4_key key(M4_Dependencies, l, m, F, E, prevj, vacancies1,
+						vacancies2);
+				map<m4_key,Vpff,compare1 >::iterator p=D1.find(key);
+				if (p==D1.end())
+					p=D1.insert(make_pair(key,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+				assert(p!=D1.end());
+				// Never index past the end of the row.
+				if (len>static_cast<int>(p->second.size())) {
+					cerr << "ERROR: record length " << len
+							<< " exceeds table width in " << fD1 << endl;
+					return false;
+				}
+				int i;
+				for (i=0; i<len; i++) {
+					ifsd >> count;
+					p->second[i].first+=count;
+				}
+
+			}
+		}
+		ifstream ifsd1(fDb);
+		if (!ifsd1) {
+			cerr << "Failed in " << fDb << endl;
+			return false;
+		}
+		{
+			while (ifsd1 >> deps >> l >> m >>F >> E >> prevj >> vacancies1
+					>>vacancies2>>len) {
+				m4_key key(M4_Dependencies, l, m, F, E, prevj, vacancies1,
+						vacancies2);
+				map<m4_key,Vpff,compareb1 >::iterator p=Db1.find(key);
+				if (p==Db1.end())
+					p=Db1.insert(make_pair(key,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+				// The iterator belongs to Db1, so it is checked against Db1.end().
+				assert(p!=Db1.end());
+				if (len>static_cast<int>(p->second.size())) {
+					cerr << "ERROR: record length " << len
+							<< " exceeds table width in " << fDb << endl;
+					return false;
+				}
+				int i;
+				for (i=0; i<len; i++) {
+					ifsd1 >> count;
+					p->second[i].first+=count;
+				}
+
+			}
+		}
+		return true;
+	}
+
+   // Reads probability records from fD1 (into D1) and fDb (into Db1) and
+   // ASSIGNS each value to the `.second` component of the matching cell.
+   // Record layout, whitespace separated:
+   //   deps l m F E prevj vacancies1 vacancies2 len  followed by len values.
+   // The `deps` value read from the file is ignored; keys are always built
+   // with M4_Dependencies.
+   // Returns false if a file cannot be opened or a record announces more
+   // values than a row can hold; values read before that point stay applied.
+   bool readProbTable(const char* fD1, const char* fDb){
+        ifstream ifsd(fD1);
+        int deps;
+        int l;
+        int m;
+        int F;
+        int E;
+        int prevj;
+        int vacancies1,vacancies2;
+        int len;
+        double count;
+        if(!ifsd){
+            cerr << "Failed in " << fD1 << endl;
+            return false;
+        }
+        {
+            while(ifsd >> deps >> l >> m >>F >> E >> prevj >> vacancies1>>vacancies2>>len){
+                m4_key key(M4_Dependencies,l,m,F,E,prevj,vacancies1,vacancies2);
+                map<m4_key,Vpff,compare1 >::iterator p=D1.find(key);
+                if(p==D1.end())p=D1.insert(make_pair(key,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+                assert(p!=D1.end());
+                // Never index past the end of the row.
+                if(len>static_cast<int>(p->second.size())){
+                    cerr << "ERROR: record length " << len
+                         << " exceeds table width in " << fD1 << endl;
+                    return false;
+                }
+                int i;
+                for(i=0;i<len;i++){
+                    ifsd >> count;
+                    p->second[i].second=count;
+                }
+                
+            }
+        }
+        ifstream ifsd1(fDb);
+        if(!ifsd1){
+            cerr << "Failed in " << fDb << endl;
+            return false;
+        }
+        {
+            while(ifsd1 >> deps >> l >> m >>F >> E >> prevj >> vacancies1>>vacancies2>>len){
+                m4_key key(M4_Dependencies,l,m,F,E,prevj,vacancies1,vacancies2);
+                map<m4_key,Vpff,compareb1 >::iterator p=Db1.find(key);
+                if(p==Db1.end())p=Db1.insert(make_pair(key,Vpff(msl*2+1,pair<COUNT,PROB>(0.0,0.0)))).first;
+                // The iterator belongs to Db1, so it is checked against Db1.end().
+                assert(p!=Db1.end());
+                if(len>static_cast<int>(p->second.size())){
+                    cerr << "ERROR: record length " << len
+                         << " exceeds table width in " << fDb << endl;
+                    return false;
+                }
+                int i;
+                for(i=0;i<len;i++){
+                    ifsd1 >> count;
+                    p->second[i].second=count;
+                }
+                
+            }
+        }
+        return true;
+    }
+    
+
+	// Writes the `.second` component of every cell of D1 to fD1 and of Db1 to
+	// fDb. Each record starts with
+	//   deps l m F E prevj vacancies1 vacancies2 size
+	// followed by the values; in fD1 the values share the header line, in fDb
+	// they go on the following line.
+	// Returns false as soon as one of the files cannot be opened; fDb is only
+	// opened after fD1 has been written.
+	bool printProbTable(const char* fD1, const char* fDb) {
+		ofstream ofsd(fD1);
+		if (!ofsd.is_open())
+			return false;
+		for (map<m4_key,Vpff,compare1 >::iterator entry = D1.begin(); entry!=D1.end(); ++entry) {
+			const m4_key& k = entry->first;
+			Vpff& row = entry->second;
+			ofsd << k.deps << " " << k.l << " " << k.m << " " << k.F << " "
+					<< k.E << " " << k.prevj << " " << k.vacancies1 << " "
+					<< k.vacancies2 << " " << row.size() << " ";
+			for (int i=0; i<row.size(); i++)
+				ofsd << row[i].second << " ";
+			ofsd << endl;
+		}
+
+		ofstream ofsdb(fDb);
+		if (!ofsdb.is_open())
+			return false;
+		for (map<m4_key,Vpff,compareb1 >::iterator entry = Db1.begin(); entry!=Db1.end(); ++entry) {
+			const m4_key& k = entry->first;
+			Vpff& row = entry->second;
+			ofsdb << k.deps << " " << k.l << " " << k.m << " " << k.F << " "
+					<< k.E << " " << k.prevj << " " << k.vacancies1 << " "
+					<< k.vacancies2 << " " << row.size() << endl;
+			for (int i=0; i<row.size(); i++)
+				ofsdb << row[i].second << " ";
+			ofsdb << endl;
+		}
+		return true;
+	}
+
+    // Writes the `.first` component of every cell of D1 to fD1 and of Db1 to
+    // fDb. Each record starts with
+    //   deps l m F E prevj vacancies1 vacancies2 size
+    // followed by the values; in fD1 the values share the header line, in fDb
+    // they go on the following line.
+    // Returns false as soon as one of the files cannot be opened; fDb is only
+    // opened after fD1 has been written.
+    bool dumpCount(const char* fD1, const char* fDb){
+        ofstream ofsd(fD1);
+        if(!ofsd.is_open())
+            return false;
+        for(map<m4_key,Vpff,compare1 >::iterator entry = D1.begin(); entry!=D1.end(); ++entry){
+            const m4_key& k = entry->first;
+            Vpff& row = entry->second;
+            ofsd << k.deps << " " << k.l << " " << k.m << " " << k.F << " "
+                 << k.E << " " << k.prevj << " " << k.vacancies1 << " "
+                 << k.vacancies2 << " " << row.size() << " ";
+            for(int i=0;i<row.size();i++)
+                ofsd << row[i].first << " ";
+            ofsd << endl;
+        }
+
+        ofstream ofsdb(fDb);
+        if(!ofsdb.is_open())
+            return false;
+        for(map<m4_key,Vpff,compareb1 >::iterator entry = Db1.begin(); entry!=Db1.end(); ++entry){
+            const m4_key& k = entry->first;
+            Vpff& row = entry->second;
+            ofsdb << k.deps << " " << k.l << " " << k.m << " " << k.F << " "
+                  << k.E << " " << k.prevj << " " << k.vacancies1 << " "
+                  << k.vacancies2 << " " << row.size() << endl;
+            for(int i=0;i<row.size();i++)
+                ofsdb << row[i].first << " ";
+            ofsdb << endl;
+        }
+        return true;
+    }
+	// Looks up the D1 entry for (l, m, F, E); the key is built with prevj = 0
+	// and both vacancy fields set to -1. Returns D1.end() when there is none.
+	map<m4_key,Vpff,compare1 >::const_iterator getProb_first_iterator(int E,
+			int F, int l, int m) const {
+		const m4_key wanted(M4_Dependencies, l, m, F, E, 0, -1, -1);
+		return D1.find(wanted);
+	}
+	// Smoothed D1 probability for position j relative to j_cp, using an entry
+	// iterator obtained beforehand (e.g. from getProb_first_iterator).
+	// Returns PROB_SMOOTH when p is D1.end(); otherwise interpolates the
+	// stored probability at offset j-j_cp+msl with 1/(2*m-1) using
+	// d4modelsmooth_factor, and never returns less than PROB_SMOOTH.
+	PROB getProb_first_withiterator(WordIndex j, WordIndex j_cp, int m,
+			const map<m4_key,Vpff,compare1 >::const_iterator& p) const {
+		assert(j>=1);
+		//assert(j_cp>=0);
+		assert(j<=msl);
+		assert(j_cp<=msl);
+		if (p==D1.end())
+			return PROB_SMOOTH;
+		const PROB stored=(p->second)[j-j_cp+msl].second;
+		massert(stored<=1.0);
+		return max(PROB_SMOOTH, d4modelsmooth_factor/(2*m-1)+(1
+				-d4modelsmooth_factor)*stored);
+	}
+
+	// Smoothed D1 probability for position j relative to j_cp.
+	// The entry is looked up with key (l, m, F, E, prevj = j_cp, -1, -1).
+	// Returns PROB_SMOOTH when no entry exists; otherwise interpolates the
+	// stored probability at offset j-j_cp+msl with 1/(2*m-1) using
+	// d4modelsmooth_factor, and never returns less than PROB_SMOOTH.
+	PROB getProb_first(WordIndex j, WordIndex j_cp, int E, int F, int l, int m) const {
+		assert(j>=1);
+		//assert(j_cp>=0);
+		assert(j<=msl);
+		assert(j_cp<=msl);
+		const m4_key wanted(M4_Dependencies, l, m, F, E, j_cp, -1, -1);
+		const map<m4_key,Vpff,compare1 >::const_iterator hit=D1.find(wanted);
+		if (hit==D1.end())
+			return PROB_SMOOTH;
+		const PROB stored=(hit->second)[j-j_cp+msl].second;
+		massert(stored<=1.0);
+		return max(PROB_SMOOTH, d4modelsmooth_factor/(2*m-1)+(1
+				-d4modelsmooth_factor)*stored);
+	}
+	// Looks up the Db1 entry for (l, m, F, E); the key is built with prevj = 0
+	// and both vacancy fields set to -1. Returns Db1.end() when there is none.
+	map<m4_key,Vpff,compareb1 >::const_iterator getProb_bigger_iterator(int E,
+			int F, int l, int m) const {
+		const m4_key wanted(M4_Dependencies, l, m, F, E, 0, -1, -1);
+		return Db1.find(wanted);
+	}
+	// Smoothed Db1 probability for position j relative to j_prev (j > j_prev),
+	// using an entry iterator obtained beforehand.
+	// Returns PROB_SMOOTH when p is Db1.end(); otherwise interpolates the
+	// stored probability at offset j-j_prev+msl with 1/(m-1) using
+	// d4modelsmooth_factor, and never returns less than PROB_SMOOTH.
+	PROB getProb_bigger_withiterator(WordIndex j, WordIndex j_prev, int m,
+			const map<m4_key,Vpff,compareb1 >::const_iterator&p) const {
+		massert(j>=1);
+		massert(j_prev>=1);
+		massert(j>j_prev);
+		massert(j<=msl);
+		massert(j_prev<=msl);
+		if (p==Db1.end())
+			return PROB_SMOOTH;
+		const PROB stored=(p->second)[j-j_prev+msl].second;
+		massert(stored<=1.0 );
+		return max(PROB_SMOOTH, d4modelsmooth_factor/(m-1)+(1
+				-d4modelsmooth_factor)*stored);
+	}
+
+	// Smoothed Db1 probability for position j relative to j_prev (j > j_prev).
+	// The entry is looked up with key (l, m, F, E, prevj = j_prev, -1, -1).
+	// Returns PROB_SMOOTH when no entry exists; otherwise interpolates the
+	// stored probability at offset j-j_prev+msl with 1/(m-1) using
+	// d4modelsmooth_factor, and never returns less than PROB_SMOOTH.
+	PROB getProb_bigger(WordIndex j, WordIndex j_prev, int E, int F, int l,
+			int m) const {
+		massert(j>=1);
+		massert(j_prev>=1);
+		massert(j>j_prev);
+		massert(j<=msl);
+		massert(j_prev<=msl);
+		const m4_key wanted(M4_Dependencies, l, m, F, E, j_prev, -1, -1);
+		const map<m4_key,Vpff,compareb1 >::const_iterator hit=Db1.find(wanted);
+		if (hit==Db1.end())
+			return PROB_SMOOTH;
+		const PROB stored=(hit->second)[j-j_prev+msl].second;
+		massert(stored<=1.0 );
+		return max(PROB_SMOOTH, d4modelsmooth_factor/(m-1)+(1
+				-d4modelsmooth_factor)*stored);
+	}
+
+	// Recomputes the probability (.second) of every cell in D1 and Db1 from
+	// the counts (.first): each row is divided by its count total. A row whose
+	// total is zero gets the uniform value 1/size. Prints the number of cells
+	// processed to cout.
+	void normalizeTable() {
+		int nParams=0;
+		for (map<m4_key,Vpff,compare1 >::iterator row=D1.begin(); row!=D1.end(); ++row) {
+			Vpff&cells=row->second;
+			double total=0.0;
+			for (PositionIndex c=0; c<cells.size(); c++)
+				total+=cells[c].first;
+			for (PositionIndex c=0; c<cells.size(); c++) {
+				if (total)
+					cells[c].second=cells[c].first/total;
+				else
+					cells[c].second=1.0/cells.size();
+				nParams++;
+			}
+		}
+		for (map<m4_key,Vpff,compareb1 >::iterator row=Db1.begin(); row!=Db1.end(); ++row) {
+			Vpff&cells=row->second;
+			double total=0.0;
+			for (PositionIndex c=0; c<cells.size(); c++)
+				total+=cells[c].first;
+			for (PositionIndex c=0; c<cells.size(); c++) {
+				if (total)
+					cells[c].second=cells[c].first/total;
+				else
+					cells[c].second=1.0/cells.size();
+				nParams++;
+			}
+		}
+		cout << "D4 table contains " << nParams << " parameters.\n";
+	}
+
+	// Resets every count (.first) in D1 and Db1 to zero. Keys and the stored
+	// probabilities (.second) are left untouched.
+	void clear() {
+		map<m4_key,Vpff,compare1 >::iterator head=D1.begin();
+		while (head!=D1.end()) {
+			Vpff&cells=head->second;
+			for (PositionIndex c=0; c<cells.size(); c++)
+				cells[c].first=0.0;
+			++head;
+		}
+		map<m4_key,Vpff,compareb1 >::iterator rest=Db1.begin();
+		while (rest!=Db1.end()) {
+			Vpff&cells=rest->second;
+			for (PositionIndex c=0; c<cells.size(); c++)
+				cells[c].first=0.0;
+			++rest;
+		}
+	}
+
+	/*void printProbTable(const char*fname1,const char*fname2)
+	 {
+	 ofstream out(fname1);
+	 double ssum=0.0;
+	 out << "# Translation tables for Model 4 .\n";
+	 out << "# Table for head of cept.\n";
+	 for(map<m4_key,Vpff,compare1 >::const_iterator i=D1.begin();i!=D1.end();++i){
+	 const Vpff&d1=i->second;
+	 double sum=0.0;
+	 for(PositionIndex ii=0;ii<d1.size();ii++)sum+=d1[ii].first;
+	 if ( sum ){
+	 print1(out,i->first,ewordclasses,fwordclasses);
+	 out << "SUM: " << sum << ' '<< '\n';
+	 for(unsigned ii=0;ii<d1.size();ii++)
+	 if( d1[ii].first )
+	 out << (int)(ii)-(int)(msl) << ' ' << d1[ii].first << '\n';
+	 out << endl;
+	 }
+	 ssum+=sum;
+	 }
+	 out << "# Table for non-head of cept.\n";
+	 for(map<m4_key,Vpff,compareb1 >::const_iterator i=Db1.begin();i!=Db1.end();++i)
+	 {
+	 const Vpff&db1=i->second;
+	 double sum=0.0;
+	 for(PositionIndex ii=0;ii<db1.size();++ii)sum+=db1[ii].first;
+	 if( sum ){
+	 printb1(out,i->first,ewordclasses,fwordclasses);
+	 out << "SUM: " << sum << ' '<<'\n';
+	 for(unsigned ii=0;ii<db1.size();ii++)
+	 if( db1[ii].first )
+	 {
+	 out << (int)(ii)-(int)(msl) << ' ' << db1[ii].first << '\n';
+	 }
+	 out << endl;
+	 }
+	 ssum+=sum;
+	 }
+	 out << endl << "FULL-SUM: " << ssum << endl;
+	 if( M4_Dependencies==76 ){
+	 ofstream out2(fname2);
+	 for(map<m4_key,Vpff,compare1 >::const_iterator i=D1.begin();i!=D1.end();++i)
+	 {
+	 const Vpff&d1=i->second;
+	 for(unsigned ii=0;ii<d1.size();ii++)
+	 if( d1[ii].first )
+	 out2 << ewordclasses.classString(i->first.E) << ' ' << fwordclasses.classString(i->first.F) << ' ' << (int)(ii)-(int)(msl) << ' ' << d1[ii].second << '\n';
+	 }
+	 for(map<m4_key,Vpff,compareb1 >::const_iterator i=Db1.begin();i!=Db1.end();++i) {
+	 const Vpff&db1=i->second;
+	 for(unsigned ii=0;ii<db1.size();ii++)
+	 if( db1[ii].first )
+	 out2 << -1 << ' ' << fwordclasses.classString(i->first.F) << ' ' << (int)(ii)-(int)(msl) << ' ' << db1[ii].second << '\n';
+	 }
+	 }
+	 }*/
+
+	/**
+	 * Reads a textual D4 table file into D1 (first section) and Db1 (second
+	 * section).
+	 *
+	 * Expected layout, as parsed below: leading '#' comment lines, then
+	 * entries consisting of a key line of "name: value" token pairs
+	 * (l:, m:, F:, E:), a "SUM: <total>" line, and "<offset> <count>" lines
+	 * terminated by an empty line. A line starting with '#' ends the first
+	 * section; the second section has the same shape and may end with a
+	 * "FULL-SUM:" line. Each stored cell is (count, count/total) at index
+	 * offset+msl.
+	 *
+	 * Unlike the earlier version, this one fails cleanly instead of looping
+	 * forever when the file cannot be opened or ends unexpectedly, and it
+	 * ignores a trailing unpaired token on a key line instead of reading past
+	 * the end of the token vector.
+	 *
+	 * @param fname path of the table file.
+	 * @return false if the file cannot be opened, true otherwise.
+	 */
+	bool readProbTable(const char *fname) {
+		cerr << "Reading D4Tables from " << fname << endl;
+		ifstream file(fname);
+		if (!file) {
+			cerr << "ERROR: can not read D4Tables from " << fname << endl;
+			return false;
+		}
+		string line;
+		// Skip the comment header. The stream check matters because a failed
+		// getline leaves 'line' unchanged, which would otherwise spin forever.
+		do {
+			getline(file, line);
+		} while (file&&line.length()&&line[0]=='#');
+
+		do {
+			// Skip blank lines, but stop at end of file.
+			while (line.length()==0&&getline(file, line))
+				;
+			if (line.length()==0||line[0]=='#')
+				break;
+			Vector<string> linestr;
+			tokenize(line, linestr);
+			m4_key k(M4_Dependencies, 0, 0, 0, 0, 0, -1, -1);
+			// Tokens come in "name: value" pairs; i+1 must be a valid index.
+			for (unsigned int i=0; i+1<linestr.size(); i+=2) {
+				if (linestr[i]=="l:") {
+					k.l=atoi(linestr[i+1].c_str());
+					iassert(M4_Dependencies&DEP_MODEL_l);
+				}
+				if (linestr[i]=="m:") {
+					k.m=atoi(linestr[i+1].c_str());
+					iassert(M4_Dependencies&DEP_MODEL_m);
+				}
+				if (linestr[i]=="F:") {
+					k.F=(*fwordclasses)(linestr[i+1]);
+					iassert(M4_Dependencies&DEP_MODEL_F);
+				}
+				if (linestr[i]=="E:") {
+					k.E=(*ewordclasses)(linestr[i+1]);
+					iassert(M4_Dependencies&DEP_MODEL_E);
+				}
+				//if( linestr[i]=="j-1:" ){k.prevj=atoi(linestr[i+1].c_str());iassert(M4_Dependencies&DEP_MODEL_pj);}
+			}
+			string str;
+			double sum=0.0;
+			file >> str >> sum;
+			iassert(str=="SUM:");
+			if (str!="SUM:")
+				cerr << "ERROR: string is " << str << " and not sum " << endl;
+
+			// Read "<offset> <count>" lines until an empty line or end of file.
+			do {
+				int value;
+				double count;
+				getline(file, line);
+				istrstream twonumbers(line.c_str());
+				if (twonumbers >> value >> count) {
+					if (D1.count(k)==0)
+						D1.insert(make_pair(k, Vpff(msl*2+1, pair<COUNT, PROB>(
+								0.0, 0.0))));
+					D1[k][value+msl]=make_pair(count, count/sum);
+				}
+			} while (file&&line.length());
+		} while (file);
+		// Skip the comment header of the second section.
+		do {
+			getline(file, line);
+		} while (file&&line.length()&&line[0]=='#');
+		do {
+			// Skip blank lines, but stop at end of file.
+			while (line.length()==0&&getline(file, line))
+				;
+			if (line.length()==0||line[0]=='#')
+				break;
+			Vector<string> linestr;
+			tokenize(line, linestr);
+			m4_key k(M4_Dependencies, 0, 0, 0, 0, 0, -1, -1);
+			bool sumRead=0;
+			for (unsigned int i=0; i+1<linestr.size(); i+=2) {
+				if (linestr[i]=="l:") {
+					k.l=atoi(linestr[i+1].c_str());
+					iassert(M4_Dependencies&DEP_MODELb_l);
+				} else if (linestr[i]=="m:") {
+					k.m=atoi(linestr[i+1].c_str());
+					iassert(M4_Dependencies&DEP_MODELb_m);
+				} else if (linestr[i]=="F:") {
+					k.F=(*fwordclasses)(linestr[i+1]);
+					iassert(M4_Dependencies&DEP_MODELb_F);
+				} else if (linestr[i]=="E:") {
+					k.E=(*ewordclasses)(linestr[i+1]);
+					iassert(M4_Dependencies&DEP_MODELb_E);
+				} else if (linestr[i]=="SUM:") {
+					// The key line is missing: this line already is the SUM line.
+					cerr << "Warning: obviously no dependency.\n";
+					sumRead=1;
+				} else if (linestr[i]=="FULL-SUM:") {
+					break;
+				} else {
+					cerr << "ERROR: error in reading d4 tables: " << linestr[i]
+							<< ' ' << linestr[i+1] << endl;
+				}
+			}
+			string str;
+			double sum=0.0;
+			if (sumRead==0)
+				file >> str >> sum;
+			else {
+				str=linestr[0];
+				sum=atof(linestr[1].c_str());
+			}
+			if (str!="SUM:")
+				cerr << "ERROR: should read SUM but read " << str << endl;
+			do {
+				int value;
+				double count;
+				getline(file, line);
+				istrstream twonumbers(line.c_str());
+				if (twonumbers >> value >> count) {
+					if (Db1.count(k)==0)
+						Db1.insert(make_pair(k, Vpff(msl*2+1,
+								pair<COUNT, PROB>(0.0, 0.0))));
+					Db1[k][value+msl]=make_pair(count, count/sum);
+				}
+			} while (file&&line.length());
+		} while (file);
+		return true;
+	}
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/D5Tables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/D5Tables.h
@ -0,0 +1,233 @@
+/*
+
+Copyright (C) 2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef _d5tables_h_define
+#define _d5tables_h_define
+#include <cmath>
+#include "D4Tables.h"
+
+extern float d5modelsmooth_countoffset;
+extern float d5modelsmooth_factor;
+
+#define UNSEENPROB (1.0/vacancies_total)
+
+/*
+ * Model 5 distortion tables.
+ *
+ * Two maps keyed by m4_key hold, per key, a vector of (count, probability)
+ * pairs indexed by a vacancy position:
+ *   D1  - table for the head of a cept,
+ *   Db1 - table for the non-head words of a cept.
+ * The word-class objects are shared with the d4model passed to the
+ * constructor.
+ */
+class d5model
+{
+ private:
+  typedef Vector < pair < COUNT,PROB > >Vpff;
+  map< m4_key,Vpff,compare1 > D1;
+  map< m4_key,Vpff,compareb1 > Db1;
+
+ public:
+  d4model&d4m;
+  WordClasses* ewordclasses;
+  WordClasses* fwordclasses;
+
+  // Reads the two word-class files into ewordclasses / fwordclasses.
+  // A file that cannot be opened is reported on cerr and skipped.
+  template<class MAPPER>
+  void makeWordClasses(const MAPPER&m1,const MAPPER&m2,string efile,string ffile
+      , const vcbList& elist,
+      const vcbList& flist)
+    {
+      ifstream estrm(efile.c_str()),fstrm(ffile.c_str());
+      if( estrm )
+        ewordclasses->read(estrm,m1,elist);
+      else
+        cerr << "ERROR: can not read classes from " << efile << endl;
+      if( fstrm )
+        fwordclasses->read(fstrm,m2,flist);
+      else
+        cerr << "ERROR: can not read classes from " << ffile << endl;
+    }
+
+  // Both maps are ordered with comparators built from M5_Dependencies; the
+  // word-class pointers are copied from the given d4model.
+  d5model (d4model&_d4m)
+    : D1 (compare1(M5_Dependencies)),
+      Db1 (compareb1(M5_Dependencies)),
+      d4m(_d4m),
+      ewordclasses(_d4m.ewordclasses),
+      fwordclasses(_d4m.fwordclasses)
+    {}
+
+  // Returns a reference to the head-of-cept count at index vacancies_j for
+  // the key (l, m, F, vacancies_jp, vacancies_total). A missing entry is
+  // created with vacancies_total+1 cells of (0, UNSEENPROB).
+  COUNT &getCountRef_first (PositionIndex vacancies_j,
+                            PositionIndex vacancies_jp, int F,
+                            PositionIndex l, PositionIndex m,
+                            PositionIndex vacancies_total)
+  {
+    massert(vacancies_j>0);
+    massert(vacancies_total>0);
+    //massert(vacancies_jp<=vacancies_total);
+    massert(vacancies_j <=vacancies_total);
+    massert(vacancies_total<=m);
+    const m4_key key(M5_Dependencies,l,m,F,0,0,vacancies_jp,vacancies_total);
+    map<m4_key,Vpff,compare1 >::iterator slot=D1.find(key);
+    if(slot==D1.end())
+      {
+        // !!! constrain length
+        slot=D1.insert(make_pair(key,Vpff(vacancies_total+1,make_pair(0,UNSEENPROB)))).first;
+      }
+    massert(slot!=D1.end());
+    return (slot->second)[vacancies_j].first;
+  }
+
+  // Returns a reference to the non-head count at index
+  // vacancies_j - vacancies_jp for the key (l, m, F, -1, vacancies_total).
+  // A missing entry is created with vacancies_total+1 cells of
+  // (0, UNSEENPROB).
+  COUNT &getCountRef_bigger (PositionIndex vacancies_j,
+                             PositionIndex vacancies_jp, int F,
+                             PositionIndex l, PositionIndex m,
+                             PositionIndex vacancies_total)
+  {
+    massert(vacancies_j>0);
+    massert(vacancies_total>0);
+    massert (vacancies_jp <= vacancies_j);
+    massert (vacancies_j-vacancies_jp <= vacancies_total);
+    const m4_key key(M5_Dependencies,l,m,F,0,0,-1,vacancies_total);
+    map<m4_key,Vpff,compareb1 >::iterator slot=Db1.find(key);
+    if(slot==Db1.end())
+      {
+        // !!! constrain length
+        slot=Db1.insert(make_pair(key,Vpff(vacancies_total+1,make_pair(0,UNSEENPROB)))).first;
+      }
+    massert(slot!=Db1.end());
+    return (slot->second)[vacancies_j - vacancies_jp].first;
+  }
+
+  // Head-of-cept probability. Returns UNSEENPROB for an unknown key;
+  // otherwise the stored probability interpolated with 1/vacancies_total
+  // via d5modelsmooth_factor, never less than PROB_SMOOTH.
+  PROB getProb_first (PositionIndex vacancies_j, PositionIndex vacancies_jp,
+                      int F, PositionIndex l, PositionIndex m,
+                      PositionIndex vacancies_total) const
+  {
+    massert(vacancies_j>0);
+    massert(vacancies_total>0);
+    //massert(vacancies_jp<=vacancies_total);
+    massert(vacancies_j <=vacancies_total);
+    massert(vacancies_total<=m);
+    const m4_key key(M5_Dependencies,l,m,F,0,0,vacancies_jp,vacancies_total);
+    const map<m4_key,Vpff,compare1 >::const_iterator hit=D1.find(key);
+    if( hit==D1.end() )
+      return UNSEENPROB;
+    return max(PROB_SMOOTH,d5modelsmooth_factor/(vacancies_total)+(1-d5modelsmooth_factor)*(hit->second)[vacancies_j].second);
+  }
+
+  // Non-head probability. Returns UNSEENPROB for an unknown key; otherwise
+  // the stored probability at index vacancies_j - vacancies_jp interpolated
+  // with 1/vacancies_total via d5modelsmooth_factor, never less than
+  // PROB_SMOOTH.
+  PROB getProb_bigger (PositionIndex vacancies_j, PositionIndex vacancies_jp,
+                       int F, PositionIndex l, PositionIndex m,
+                       PositionIndex vacancies_total) const
+  {
+    massert(vacancies_j>0);
+    massert(vacancies_total>0);
+    massert (vacancies_jp <= vacancies_j);
+    massert (vacancies_j-vacancies_jp <= vacancies_total);
+    const m4_key key(M5_Dependencies,l,m,F,0,0,-1,vacancies_total);
+    const map<m4_key,Vpff,compareb1 >::const_iterator hit=Db1.find(key);
+    if( hit==Db1.end() )
+      return UNSEENPROB;
+    return max(PROB_SMOOTH,d5modelsmooth_factor/(vacancies_total)+(1-d5modelsmooth_factor)*(hit->second)[vacancies_j - vacancies_jp].second);
+  }
+
+  // Recomputes every probability from the counts: each count is offset by
+  // d5modelsmooth_countoffset and divided by the offset row total. A row
+  // whose total is zero gets the uniform value 1/size. Prints the number of
+  // cells processed to cout.
+  void normalizeTable ()
+    {
+      int nParams=0;
+      for(map<m4_key,Vpff,compare1 >::iterator row=D1.begin();row!=D1.end();++row)
+        {
+          Vpff&cells=row->second;
+          COUNT total=0.0;
+          for(PositionIndex c=0;c<cells.size();c++)
+            total+=cells[c].first+d5modelsmooth_countoffset;
+          for(PositionIndex c=0;c<cells.size();c++)
+            {
+              if( total )
+                cells[c].second=(cells[c].first+d5modelsmooth_countoffset)/total;
+              else
+                cells[c].second=1.0/cells.size();
+              nParams++;
+            }
+        }
+      for(map<m4_key,Vpff,compareb1 >::iterator row=Db1.begin();row!=Db1.end();++row)
+        {
+          Vpff&cells=row->second;
+          double total=0.0;
+          for(PositionIndex c=0;c<cells.size();c++)
+            total+=cells[c].first+d5modelsmooth_countoffset;
+          for(PositionIndex c=0;c<cells.size();c++)
+            {
+              if( total )
+                cells[c].second=(cells[c].first+d5modelsmooth_countoffset)/total;
+              else
+                cells[c].second=1.0/cells.size();
+              nParams++;
+            }
+        }
+      cout << "D5 table contains " << nParams << " parameters.\n";
+    }
+
+  // Dumps both tables as text. Rows whose counts sum to zero are skipped.
+  // For every cell of a printed row the key is written (print1_m5 for D1,
+  // printb1_m5 for Db1) followed by "index probability count".
+  friend ostream&operator<<(ostream&out,d5model&d5m) {
+    out << "# Translation tables for Model 5 .\n";
+    out << "# Table for head of cept.\n";
+    for(map<m4_key,Vpff,compare1 >::const_iterator row=d5m.D1.begin();row!=d5m.D1.end();++row){
+        const Vpff&cells=row->second;
+        COUNT total=0.0;
+        for(PositionIndex c=0;c<cells.size();c++)
+            total+=cells[c].first;
+        if( !total )
+            continue;
+        for(unsigned c=0;c<cells.size();c++){
+            print1_m5(out,row->first,*d5m.ewordclasses,*d5m.fwordclasses);
+            out << (int)(c) << ' ' << cells[c].second  << ' ' << cells[c].first << '\n';
+        }
+        out << endl;
+    }
+    out << "# Table for non-head of cept.\n";
+    for(map<m4_key,Vpff,compareb1 >::const_iterator row=d5m.Db1.begin();row!=d5m.Db1.end();++row){
+        const Vpff&cells=row->second;
+        double total=0.0;
+        for(PositionIndex c=0;c<cells.size();++c)
+            total+=cells[c].first;
+        if( !total )
+            continue;
+        for(unsigned c=0;c<cells.size();c++){
+            printb1_m5(out,row->first,*d5m.fwordclasses);
+            out << (int)(c) << ' ' << cells[c].second << ' ' << cells[c].first << '\n';
+        }
+        out << endl;
+    }
+    return out;
+  }
+
+  // Reads a table file line by line. Lines starting with '#' are skipped.
+  // Every other line is parsed as "E F v1 v2 index prob count"; lines with a
+  // positive count are added to Db1 when E is "-1" and to D1 otherwise,
+  // always with l = m = 1000. The tables are normalized afterwards.
+  void readProbTable(const char*x)
+    {
+      ifstream f(x);
+      string l;
+      while(getline(f,l))
+        {
+          if(l.length()&&l[0]=='#')
+            continue;
+          istrstream is(l.c_str());
+          string E,F;
+          int v1,v2,ii;
+          double prob,count;
+          if( !(is>>E>>F>>v1>>v2>>ii>>prob>>count) )
+            continue;
+          //cerr << "Read: " << E << " " << F << " " << v1 << " " << v2 << " " << prob<< endl;
+          if( count>0 )
+            {
+              if( E=="-1")
+                getCountRef_bigger(ii,0,(*fwordclasses)(F),1000,1000,v2)+=count;
+              else
+                getCountRef_first(ii,v1,(*fwordclasses)(F),1000,1000,v2)+=count;
+            }
+        }
+      normalizeTable();
+      //ofstream of("M5FILE");
+      //of << (*this);
+    }
+
+  // Resets every count in D1 and Db1 to zero; probabilities are kept.
+  void clear()
+    {
+      for(map<m4_key,Vpff,compare1 >::iterator row=D1.begin();row!=D1.end();++row)
+        {
+          Vpff&cells=row->second;
+          for(PositionIndex c=0;c<cells.size();c++)
+            cells[c].first=0.0;
+        }
+      for(map<m4_key,Vpff,compareb1 >::iterator row=Db1.begin();row!=Db1.end();++row)
+        {
+          Vpff&cells=row->second;
+          for(PositionIndex c=0;c<cells.size();c++)
+            cells[c].first=0.0;
+        }
+    }
+};
+
+#endif
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Dictionary.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Dictionary.cpp
@ -0,0 +1,93 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* Noah A. Smith
+   Dictionary object for dictionary filter in Model 1 training
+
+   Dictionary file must be in order (sorted) by Foreign vocab id, but English
+   vocab ids may be in any order.
+
+   9 August 1999
+*/
+
+#include "Dictionary.h"
+#include <cstring>
+
+// Loads a dictionary of integer pairs from the given file.
+// An empty filename produces a "dead" dictionary for which indict() always
+// returns false. If the file cannot be opened the program exits with
+// status 1. Pairs are read as "p q" until extraction fails; p is appended to
+// pairs[0] and q to pairs[1].
+Dictionary::Dictionary(const char *filename){
+  dead = (filename[0] == '\0');
+  if(dead)
+    return;
+
+  cout << "Reading dictionary from:  " << filename << '\n';
+  ifstream dFile(filename);
+  if(!dFile){
+    cerr << "ERROR: Can't open dictionary: " << filename << '\n';
+    exit(1);
+  }
+
+  // Lookup cache used by indict().
+  currval = 0;
+  currindexmin = 0;
+  currindexmax = 0;
+
+  int first, second;
+  while((dFile >> first >> second)){
+    pairs[0].push_back(first);
+    pairs[1].push_back(second);
+  }
+  cout << "Dictionary read; " << pairs[0].size() << " pairs loaded." << '\n';
+  dFile.close();
+}
+
+
+// Returns true if the pair (p, q) is in the dictionary.
+//
+// pairs[0] must be sorted ascending (see the file header); pairs[1] may be in
+// any order within a run of equal p. The index range of the most recently
+// searched p is cached in currval / currindexmin / currindexmax so that
+// repeated queries for the same p skip the binary search.
+//
+// Fixes over the previous version, which read outside the vectors:
+//  - the downward scan used an unsigned index that wrapped below 0,
+//  - the upward scan read pairs[0][t] before checking t < size,
+//  - an empty dictionary read pairs[0][0],
+//  - the constructor's initial cache (currval 0, range [0,0]) was trusted
+//    for p == 0 even when entry 0 belongs to another key.
+bool Dictionary::indict(int p, int q){
+  if(dead) return false;
+  if(p == 0 && q == 0) return false;
+
+  const int n = static_cast<int>(pairs[0].size());
+
+  if(currval == p){
+    // Cached range: stay inside the vectors and re-check the key.
+    for(int i = currindexmin; i <= currindexmax && i < n; i++)
+      if(pairs[0][i] == p && pairs[1][i] == q) return true;
+    return false;
+  }
+
+  // Binary search for any entry whose first component equals p.
+  int begin = 0, end = n - 1, middle = 0;
+  bool found = false;
+  while(begin <= end){
+    middle = begin + ((end - begin) >> 1);
+    if(p < pairs[0][middle]) end = middle - 1;
+    else if(p > pairs[0][middle]) begin = middle + 1;
+    else{
+      found = true;
+      break;
+    }
+  }
+
+  bool ret = false;
+  if(found){
+    // Widen to the full run of entries with key p.
+    int lo = middle, hi = middle;
+    while(lo > 0 && pairs[0][lo - 1] == p) --lo;
+    while(hi + 1 < n && pairs[0][hi + 1] == p) ++hi;
+    for(int i = lo; i <= hi; i++)
+      if(pairs[1][i] == q){
+        ret = true;
+        break;
+      }
+    currindexmin = lo;
+    currindexmax = hi;
+  }
+  else{
+    // Cache an empty range so repeated misses for p stay cheap.
+    currindexmin = middle + 1;
+    currindexmax = middle;
+  }
+  currval = p;
+  return ret;
+}
+  
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Dictionary.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Dictionary.h
@ -0,0 +1,48 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* Noah A. Smith
+   Dictionary object for dictionary filter in Model 1 training
+
+   9 August 1999
+*/
+
+#include <iostream>
+#include <fstream>
+
+#include "Vector.h"
+
+#ifndef DICTIONARY_H
+#define DICTIONARY_H
+
+// Dictionary of integer pairs with a one-entry lookup cache.
+class Dictionary{
+ public:
+  // Loads the pairs from the named file; an empty name gives a dictionary
+  // that matches nothing.
+  Dictionary(const char *filename);
+  // True if the pair (p, q) was loaded.
+  bool indict(int p, int q);
+
+ private:
+  // pairs[0][i] and pairs[1][i] together form the i-th pair.
+  Vector<int> pairs[2];
+  // Cache of the last lookup: the key and its index range in pairs[0].
+  int currval;
+  int currindexmin;
+  int currindexmax;
+  // Set when the dictionary was constructed with an empty filename.
+  bool dead;
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/FlexArray.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/FlexArray.h
@ -0,0 +1,58 @@
+/*
+
+Copyright (C) 1988,1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef CLASS_FlexArray_defined
+#define CLASS_FlexArray_defined
+#include "Array.h"
+#include <iostream>
+#include <fstream>
+// Array whose valid indices run from low() to high() inclusive instead of
+// starting at 0. Storage is an Array<T> of high-low+1 elements; index i maps
+// to storage slot i-low. The default range (0,-1) is empty.
+template<class T>
+class FlexArray
+{
+private:
+  Array<T> p;
+  int start,End;
+public:
+  // Creates the range [_start,_end] with default-constructed elements.
+  FlexArray(int _start=0,int _end=-1)
+    : p(_end-_start+1),start(_start),End(_end) {}
+  // Creates the range [_start,_end] with every element set to init.
+  FlexArray(int _start,int _end,const T&init)
+    : p(_end-_start+1,init),start(_start),End(_end) {}
+  // Element access by external index; no range check is done here.
+  T&operator[](int i)
+    {return p[i-start];}
+  const T&operator[](int i)const
+    {return p[i-start];}
+  int low()const{return start;}
+  int high()const{return End;}
+  // Raw pointers to the first and one-past-last element. These used to call
+  // conv<double> regardless of T, so they were only usable for
+  // FlexArray<double>; conv<T> matches the element type.
+  // NOTE(review): assumes conv<X> takes the iterator of an Array<X>, as its
+  // other uses in this code base suggest - confirm against Vector.h/Array.h.
+  T*begin(){return conv<T>(p.begin());}
+  T*end(){return conv<T>(p.end());}
+};
+
+// Prints every element as "index:value; " from x.low() to x.high().
+template<class T>
+inline ostream&operator<<(ostream&out,const FlexArray<T>&x)
+{
+  int idx=x.low();
+  while(idx<=x.high())
+    {
+      out << idx << ':' << x[idx] << ';' << ' ';
+      ++idx;
+    }
+  return out;
+}
+
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ForwardBackward.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ForwardBackward.cpp
@ -0,0 +1,240 @@
+/*
+
+ Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+ This file is part of GIZA++ ( extension of GIZA ).
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
+ USA.
+
+ */
+#ifndef NO_TRAINING
+#include "ForwardBackward.h"
+#include "Globals.h"
+#include "myassert.h"
+#include "HMMTables.h"
+#include "mymath.h"
+
+// Forward-backward pass over an HMM network with I = net.size1() states and
+// J = net.size2() positions.
+//
+// Outputs:
+//   g - resized to I*J; holds alpha*beta per (position, state), stored at
+//       index j*I+i, with each block of I values passed through
+//       normalize_if_possible.
+//   E - transition expectations. If E.size()==1 a single I x I matrix
+//       accumulates over all positions; otherwise E[j-1] is filled for
+//       position j. All matrices are divided by the total of their entries.
+// Returns the value normalize_if_possible gave for the first position, or
+// 1.0 when there are no positions.
+double ForwardBackwardTraining(const HMMNetwork&net, Array<double>&g, Array<
+		Array2<double> >&E) {
+	const int I = net.size1(), J = net.size2(), N = I * J;
+	Array<double> alpha(N, 0), beta(N, 0), sum(J);
+	// Backward pass: the last position is seeded from the network's beta
+	// initialisation, then cur_beta walks backwards through the array.
+	for (int i = 0; i < I; i++)
+		beta[N - I + i] = net.getBetainit(i);
+	double * cur_beta = conv<double> (beta.begin()) + N - I - 1;
+	for (int j = J - 2; j >= 0; --j)
+		for (int ti = I - 1; ti >= 0; --ti, --cur_beta) {
+			const double *next_beta = conv<double> (beta.begin()) + (j + 1) * I;
+			const double *alprob = &net.outProb(j, ti, 0), *next_node =
+					&net.nodeProb(0, j + 1);
+			// The pointers step through outProb(j,ti,ni) and nodeProb(ni,j+1);
+			// the masserts check the strides (1 and J) against the accessors.
+			for (int ni = 0; ni < I; ++ni, (next_node += J)) {
+				massert(cur_beta<next_beta&& &net.outProb(j,ti,ni)==alprob);
+				massert(next_node == &net.nodeProb(ni,j+1));
+				/*	if( VERB&&(*next_beta)*(*alprob)*(*next_node) )
+				 cout << "B= " << (int)(cur_beta-beta.begin()) << " += " << (*next_beta) << "("
+				 << next_beta-beta.begin() << ") alprob:" << (*alprob) << "  lexprob:" << (*next_node) << endl;*/
+				(*cur_beta) += (*next_beta++) * (*alprob++) * (*next_node);
+			}
+		}
+	// Forward pass: position 0 is seeded from the alpha initialisation times
+	// the node probability.
+	for (int i = 0; i < I; i++)
+		alpha[i] = net.getAlphainit(i) * net.nodeProb(i, 0);
+	double* cur_alpha = conv<double> (alpha.begin()) + I;
+	cur_beta = conv<double> (beta.begin()) + I;
+	for (int j = 1; j < J; j++) {
+		Array2<double>&e = E[(E.size() == 1) ? 0 : (j - 1)];
+		// A shared matrix (E.size()==1) is reset only once, at j==1.
+		if ((E.size() != 1) || j == 1) {
+			e.resize(I, I);
+			fill(e.begin(), e.end(), 0.0);
+		}
+
+		for (int ti = 0; ti < I; ++ti, ++cur_alpha, ++cur_beta) {
+			const double * prev_alpha = conv<double> (alpha.begin()) + I * (j
+					- 1);
+			double *cur_e = &e(ti, 0);
+			double this_node = net.nodeProb(ti, j);
+			const double* alprob = &net.outProb(j - 1, 0, ti);
+			// alprob steps by I to visit outProb(j-1,pi,ti) for each pi.
+			for (int pi = 0; pi < I; ++pi, ++prev_alpha, (alprob += I)) {
+				massert(prev_alpha<cur_alpha&& &net.outProb(j-1,pi,ti)==alprob);
+				massert(&e(ti,pi)==cur_e);
+				const double alpha_increment = *prev_alpha * (*alprob)
+						* this_node;
+				(*cur_alpha) += alpha_increment;
+				(*cur_e++) += alpha_increment * (*cur_beta);
+			}
+		}
+	}
+	// g = alpha * beta, element by element.
+	g.resize(N);
+	transform(alpha.begin(), alpha.end(), beta.begin(), g.begin(), multiplies<
+			double> ());
+	// Consistency check: bsum (total from position 0) against the average
+	// total of the transition expectations per step.
+	double bsum = 0, esum = 0, esum2;
+	for (int i = 0; i < I; i++)
+		bsum += beta[i] * net.nodeProb(i, 0) * net.getAlphainit(i);
+	for (unsigned int j = 0; j < (unsigned int) E.size(); j++) {
+		Array2<double>&e = E[j];
+		const double *epe = e.end();
+		for (const double*ep = e.begin(); ep != epe; ++ep)
+			esum += *ep;
+	}
+	if (J > 1)
+		esum2 = esum / (J - 1);
+	else
+		esum2 = 0.0;
+	if (!(esum2 == 0.0 || mfabs(esum2 - bsum) / bsum < 1e-3 * I))
+		cout << "ERROR2: " << esum2 << " " << bsum << " " << esum << net
+				<< endl;
+	// Normalise g one position (I values) at a time and keep each returned
+	// value in sum[]; a value that deviates from bsum is reported.
+	double * sumptr = conv<double> (sum.begin());
+	double* ge = conv<double> (g.end());
+	for (double* gp = conv<double> (g.begin()); gp != ge; gp += I) {
+		*sumptr++ = normalize_if_possible(gp, gp + I);
+		if (bsum && !(mfabs((*(sumptr - 1) - bsum) / bsum) < 1e-3 * I))
+			cout << "ERROR: " << *(sumptr - 1) << " " << bsum << " " << mfabs(
+					(*(sumptr - 1) - bsum) / bsum) << ' ' << I << ' ' << J
+					<< endl;
+	}
+	// Scale the transition expectations by their overall total.
+	for (unsigned int j = 0; j < (unsigned int) E.size(); j++) {
+		Array2<double>&e = E[j];
+		double* epe = e.end();
+		if (esum)
+			for (double*ep = e.begin(); ep != epe; ++ep)
+				*ep /= esum;
+		else
+			// NOTE(review): with esum == 0 this divides the entries by a
+			// constant rather than assigning a uniform value - confirm intent.
+			for (double*ep = e.begin(); ep != epe; ++ep)
+				*ep /= 1.0 / (max(I * I, I * I * (J - 1)));
+	}
+	if (sum.size())
+		return sum[0];
+	else
+		return 1.0;
+}
+// Runs ForwardBackwardTraining on the network and stores, for every position
+// j, the index of the state with the largest value in g at that position
+// into vit[j]. vit is resized to net.size2().
+void HMMViterbi(const HMMNetwork&net, Array<int>&vit) {
+	const int I = net.size1(), J = net.size2();
+	vit.resize(J);
+	Array<double> posterior;
+	Array<Array2<double> > transitions(1);
+	ForwardBackwardTraining(net, posterior, transitions);
+	int pos = 0;
+	while (pos < J) {
+		// Block of I values belonging to this position.
+		double * first = conv<double> (posterior.begin()) + I * pos;
+		double * const last = first + I;
+		vit[pos] = max_element(first, last) - first;
+		++pos;
+	}
+}
+// Same selection as the two-argument overload, but uses the values already
+// present in g: for every position j, vit[j] becomes the index of the largest
+// of the I values stored at g[j*I .. j*I+I-1]. vit is resized to net.size2().
+void HMMViterbi(const HMMNetwork&net, Array<double>&g, Array<int>&vit) {
+	const int I = net.size1(), J = net.size2();
+	vit.resize(J);
+	int pos = 0;
+	while (pos < J) {
+		double* first = conv<double> (g.begin()) + I * pos;
+		double* const last = first + I;
+		vit[pos] = max_element(first, last) - first;
+		++pos;
+	}
+}
+
+// Best-path search through the HMM network.
+//
+// vitar is resized to J = net.size2() and receives the chosen state for
+// every position. If pegj names a position, the states allowed there are
+// restricted: only pegi when pegi != -1, otherwise only states >= I/2.
+// With verbose set, the node and transition probabilities along the chosen
+// path are printed to cout.
+// Returns the largest value in the last column, or 1.0 when J == 0.
+double HMMRealViterbi(const HMMNetwork&net, Array<int>&vitar, int pegi,
+		int pegj, bool verbose) {
+	const int I = net.size1(), J = net.size2(), N = I * J;
+	// alpha holds the best score per (position, state) at index j*I+i;
+	// bp holds, per cell, a pointer to the predecessor cell inside alpha.
+	Array<double> alpha(N, -1);
+	Array<double*> bp(N, (double*) 0);
+	vitar.resize(J);
+	if (J == 0)
+		return 1.0;
+	for (int i = 0; i < I; i++) {
+		alpha[i] = net.getAlphainit(i) * net.nodeProb(i, 0);
+		if (i > I / 2)
+			alpha[i] = 0; // only first empty word can be chosen
+		bp[i] = 0;
+	}
+	double *cur_alpha = conv<double> (alpha.begin()) + I;
+	double **cur_bp = conv<double*> (bp.begin()) + I;
+	for (int j = 1; j < J; j++) {
+		// Apply the peg to column j-1 before it is used as predecessor.
+		if (pegj + 1 == j)
+			for (int ti = 0; ti < I; ti++)
+				if ((pegi != -1 && ti != pegi) || (pegi == -1 && ti < I / 2))
+					(cur_alpha - I)[ti] = 0.0;
+		for (int ti = 0; ti < I; ++ti, ++cur_alpha, ++cur_bp) {
+			double* prev_alpha = conv<double> (alpha.begin()) + I * (j - 1);
+			double this_node = net.nodeProb(ti, j);
+			const double *alprob = &net.outProb(j - 1, 0, ti);
+			// Keep the best predecessor; alprob steps by I to visit
+			// outProb(j-1,pi,ti) for each pi.
+			for (int pi = 0; pi < I; ++pi, ++prev_alpha, (alprob += I)) {
+				massert(prev_alpha<cur_alpha&& &net.outProb(j-1,pi,ti)==alprob);
+				const double alpha_increment = *prev_alpha * (*alprob)
+						* this_node;
+				if (alpha_increment > *cur_alpha) {
+					(*cur_alpha) = alpha_increment;
+					(*cur_bp) = prev_alpha;
+				}
+			}
+		}
+	}
+	// Weight the last column with the beta initialisation, then apply the
+	// peg if it refers to the last position.
+	for (int i = 0; i < I; i++)
+		alpha[N - I + i] *= net.getBetainit(i);
+	if (pegj == J - 1)
+		for (int ti = 0; ti < I; ti++)
+			if ((pegi != -1 && ti != pegi) || (pegi == -1 && ti < I / 2))
+				(alpha)[N - I + ti] = 0.0;
+
+	// Pick the best final state and follow the back pointers; the state
+	// index is the pointer's offset from the start of the previous column.
+	int j = J - 1;
+	cur_alpha = conv<double> (alpha.begin()) + j * I;
+	vitar[J - 1] = max_element(cur_alpha, cur_alpha + I) - cur_alpha;
+	double ret = *max_element(cur_alpha, cur_alpha + I);
+	while (bp[vitar[j] + j * I]) {
+		cur_alpha -= I;
+		vitar[j - 1] = bp[vitar[j] + j * I] - cur_alpha;
+		massert(vitar[j-1]<I&&vitar[j-1]>=0);
+		j--;
+	}
+	massert(j==0);
+	if (verbose) {
+		cout << "VERB:PEG: " << pegi << ' ' << pegj << endl;
+		for (int j = 0; j < J; j++)
+			cout << "NP " << net.nodeProb(vitar[j], j) << ' ' << "AP " << ((j
+					== 0) ? net.getAlphainit(vitar[j]) : net.outProb(j - 1,
+					vitar[j - 1], vitar[j])) << " j:" << j << " i:" << vitar[j]
+					<< ";  ";
+		cout << endl;
+	}
+	return ret;
+}
+
+// Hard-assignment counterpart of ForwardBackwardTraining: takes the path
+// found by HMMRealViterbi and turns it into 0/1 statistics.
+//   g - resized to I*J and zeroed; the chosen state of each position is 1.0.
+//   E - if E.size()==1, one I x I matrix counts all transitions of the path;
+//       otherwise E[i-1] is reset and receives the single transition into
+//       position i.
+// Returns the value returned by HMMRealViterbi.
+double MaximumTraining(const HMMNetwork&net, Array<double>&g, Array<Array2<
+		double> >&E) {
+	Array<int> path;
+	const double best = HMMRealViterbi(net, path);
+	const int I = net.size1(), J = net.size2();
+	const bool shared = (E.size() == 1);
+
+	if (shared)
+		E[0].resize(I, I);
+	g.resize(I * J);
+	fill(g.begin(), g.end(), 0.0);
+	if (shared)
+		fill(E[0].begin(), E[0].end(), 0.0);
+
+	for (int pos = 0; pos < J; ++pos) {
+		g[pos * I + path[pos]] = 1.0;
+		if (pos == 0)
+			continue;
+		Array2<double>&counts = E[shared ? 0 : (pos - 1)];
+		if (!shared) {
+			// Per-position matrices are reset before taking their one count.
+			counts.resize(I, I);
+			fill(counts.begin(), counts.end(), 0.0);
+		}
+		counts(path[pos], path[pos - 1])++;
+	}
+	return best;
+}
+
+#endif
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ForwardBackward.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/ForwardBackward.h
@ -0,0 +1,62 @@
+/*
+
+Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef NO_EM_MARKOF_ZEUGS_DEFINED
+#define NO_EM_MARKOF_ZEUGS_DEFINED
+#ifndef NO_TRAINING
+#include "myassert.h"
+#include "Array.h"
+#include "Array2.h"
+
+/**
+ * Trellis description consumed by the HMM routines declared in this header:
+ * `as` states (size1) by `bs` positions (size2), with node probabilities,
+ * transition tables and initial/final state weights.
+ */
+class HMMNetwork
+{
+ public:
+  int as;                     // number of states, returned by size1()
+  int bs;                     // number of positions, returned by size2()
+  Array2<double> n;           // node probabilities, read through nodeProb(i,j)
+  Array<Array2<double> > e;   // transition tables, read through outProb(j,i1,i2)
+  Array<double> alphainit;    // initial weights; 1.0/as each after construction
+  Array<double> betainit;     // final weights; 1.0 each after construction
+  int ab;                     // as*bs
+  double finalMultiply;       // 1.0 after construction
+
+  // Creates an I x J network; the list of transition tables starts empty.
+  HMMNetwork(int I,int J)
+    : as(I),
+      bs(J),
+      n(I,J),
+      e(0),
+      alphainit(I,1.0/I),
+      betainit(I,1.0),
+      ab(I*J),
+      finalMultiply(1.0)
+    {}
+
+  double getAlphainit(int i)const
+    {return alphainit[i];}
+  double getBetainit(int i)const
+    {return betainit[i];}
+  inline int size1()const
+    {return as;}
+  inline int size2()const
+    {return bs;}
+  inline const double&nodeProb(int i,int j)const
+    {return n(i,j);}
+
+  // Transition probability i1 -> i2 leaving position j. Positions past the
+  // last stored table fall back to the last table.
+  inline const double&outProb(int j,int i1,int i2)const
+    {
+      const int lastTable=int(e.size())-1;
+      return e[min(lastTable,j)](i1,i2);
+    }
+
+  // Dumps all tables in a human-readable form.
+  friend ostream&operator<<(ostream&out,const HMMNetwork&x)
+    {
+      out <<"N: \n"<< x.n << endl;
+      out << "E: \n" << x.e;
+      out << "A:\n" << x.alphainit;
+      out << "B:\n" << x.betainit << endl;
+      return out;
+    }
+};
+// Entry points of the HMM routines that operate on an HMMNetwork.
+// Their definitions live outside this header.
+double ForwardBackwardTraining(const HMMNetwork& mc,
+                               Array<double>& gamma,
+                               Array<Array2<double> >& epsilon);
+
+void HMMViterbi(const HMMNetwork& mc, Array<int>& vit);
+
+// pegi/pegj default to -1 and verbose defaults to off.
+double HMMRealViterbi(const HMMNetwork& net,
+                      Array<int>& vit,
+                      int pegi=-1,
+                      int pegj=-1,
+                      bool verbose=false);
+
+double MaximumTraining(const HMMNetwork& net,
+                       Array<double>& g,
+                       Array<Array2<double> >& e);
+
+void HMMViterbi(const HMMNetwork& net, Array<double>& g, Array<int>& vit);
+#endif
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Globals.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Globals.h
@ -0,0 +1,75 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef Globals_asdf_defined
+#define Globals_asdf_defined
+#include <string>
+#include <fstream>
+#include <map>
+#include <syncObj.h>
+#include "defs.h"
+#include "Vector.h"
+
+// ---- Global settings shared across the toolkit (declared here, defined elsewhere) ----
+extern float PROB_SMOOTH;
+extern float MINCOUNTINCREASE;
+
+extern bool Verbose;
+extern bool Log;
+extern bool Peg;
+extern bool Transfer;
+extern bool Transfer2to3;
+extern bool useDict;
+
+extern string Prefix;
+extern string LogFilename;
+extern string OPath;
+extern string SourceVocabFilename;
+extern string TargetVocabFilename;
+extern string CorpusFilename;
+extern string TestCorpusFilename;
+extern string t_Filename;
+extern string a_Filename;
+extern string p0_Filename;
+extern string d_Filename;
+extern string n_Filename;
+extern string dictionary_Filename;
+
+// Log stream and the mutex declared alongside it.
+extern ofstream logmsg;
+extern Mutex logmsg_lock;
+
+extern double M5P0;
+extern double P0;
+
+extern bool NODUMPS;
+extern bool FEWDUMPS;
+
+extern string Usage;
+extern unsigned int MAX_SENTENCE_LENGTH;
+extern int PegUntil;
+
+extern short DeficientDistortionForEmptyWord;
+
+extern int M4_Dependencies;
+extern int M5_Dependencies;
+
+extern short OutputInAachenFormat;
+
+// Bit flags; each value is a distinct power of two so they can be OR-ed.
+#define DEP_MODEL_l 1
+#define DEP_MODEL_m 2
+#define DEP_MODEL_F 4
+#define DEP_MODEL_E 8
+
+#define DEP_MODELb_l 16
+#define DEP_MODELb_m 32
+#define DEP_MODELb_F 64
+#define DEP_MODELb_E 128
+
+#define DEP_SUM 256
+
+class vcbList;
+
+extern vcbList *globeTrainVcbList;
+extern vcbList *globfTrainVcbList;
+
+extern short PredictionInAlignments;
+extern short SmoothHMM;
+
+// Short alias for the Verbose flag.
+#define VERB Verbose
+
+double ErrorsInAlignment(const map< pair<int,int>,char >& reference,
+                         const Vector<WordIndex>& test,
+                         int l,
+                         int& missing,
+                         int& toomuch,
+                         int& eventsMissing,
+                         int& eventsToomuch,
+                         int);
+extern Vector<map< pair<int,int>,char > > ReferenceAlignment;
+void printGIZAPars(ostream& out);
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/HMMTables.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/HMMTables.cpp
@ -0,0 +1,512 @@
+/*
+
+ Copyright (C) 1998,1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+ This file is part of GIZA++ ( extension of GIZA ).
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful, 
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+ USA.
+
+ */
+#include "HMMTables.h"
+#include <fstream>
+#include <sstream>
+#include "Globals.h"
+#include "Parameter.h"
+
+/**
+ * Writes a human-readable dump of every jump distribution in alProb to `out`:
+ * the dependency key (via printAlDeps), each non-zero "offset:value; " entry,
+ * the sum of that distribution and, at the end, the sum over all of them.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> void HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::writeJumps(ostream&out) const {
+	typedef typename map<AlDeps<CLS>,FlexArray<double> >::const_iterator TableIter;
+	double grandTotal=0.0;
+	for (TableIter entry=alProb.begin(); entry!=alProb.end(); ++entry) {
+		const FlexArray<double>&dist=entry->second;
+		double total=0.0;
+		out << "\n\nDistribution for: ";
+		printAlDeps(out, entry->first, *mapper1, *mapper2);
+		out << ' ';
+		for (int a=dist.low(); a<=dist.high(); ++a) {
+			if (!dist[a])
+				continue; // zero entries are not printed
+			out << a << ':' << dist[a] << ';' << ' ';
+			total+=dist[a];
+		}
+		out << '\n' << '\n';
+		out << "SUM: " << total << '\n';
+		grandTotal+=total;
+	}
+	out << "FULL-SUM: " << grandTotal << '\n';
+}
+// Stream-based loading is a no-op: the stream is not read and the tables
+// are left unchanged.
+template<class CLS, class MAPPERCLASSTOSTRING>
+void HMMTables<CLS, MAPPERCLASSTOSTRING>::readJumps(istream&) {
+}
+/**
+ * Returns the stored jump value for aligning to position `k` given the
+ * previous position `istrich`.
+ *
+ * The index into the distribution depends on PredictionInAlignments:
+ *   0: istrich-k,  1: k,  2: (k*J - j*sentLength)/J rounded to nearest.
+ * Any other setting aborts.
+ *
+ * @param istrich     previous position, in [-1, sentLength).
+ * @param k           current position, in [0, sentLength).
+ * @param sentLength  sentence length used in the dependency key.
+ * @param J,j         only used for the index in mode 2 (j is also part of
+ *                    the key).
+ * @param w1,w2       classes stored in the dependency key.
+ * @param iter        a warning is printed for a missing key when
+ *                    0 < iter < 5000.
+ * @return the table value, or 1/(2*sentLength-1) when the key is unknown.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> double HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::getAlProb(int istrich, int k, int sentLength,
+		int J, CLS w1, CLS w2, int j, int iter) const {
+	massert(k<sentLength&&k>=0);
+	massert(istrich<sentLength&&istrich>=-1);
+	int pos=0;
+	switch (PredictionInAlignments) {
+	case 0:
+		pos=istrich-k;
+		break;
+	case 1:
+		pos=k;
+		break;
+	case 2:
+		pos=(k*J-j*sentLength);
+		if (pos>0)
+			pos+=J/2;
+		else
+			pos-=J/2;
+		pos/=J;
+		break;
+	default:
+		abort();
+	}
+	const AlDeps<CLS> deps(sentLength, istrich, j, w1, w2);
+	lock.lock();
+	typename map<AlDeps<CLS>,FlexArray<double> >::const_iterator p=
+			alProb.find(deps);
+	if (p!=alProb.end() ) {
+		// Read the value before releasing the mutex so the access cannot
+		// race with addAlCount() updating the same entry.
+		const double prob=(p->second)[pos];
+		lock.unlock();
+		return prob;
+	}
+	if (iter>0&&iter<5000)
+		cout << "WARNING: Not found: " << ' ' << J << ' ' << sentLength
+				<< '\n';
+	lock.unlock();
+	return 1.0/(2*sentLength-1);
+}
+
+/**
+ * Adds `value` to alProb and, when non-zero, `valuePredicted` to
+ * alProbPredicted for the jump from `istrich` to `k`.
+ *
+ * The index into the distribution follows PredictionInAlignments exactly as
+ * in getAlProb (0: istrich-k, 1: k, 2: rounded (k*J - j*sentLength)/J).
+ * A missing distribution is created on demand; it spans
+ * [-MAX_SENTENCE_LENGTH, MAX_SENTENCE_LENGTH] when the sentence length is not
+ * part of the key (CompareAlDeps bit 1 clear) and [-sentLength, sentLength]
+ * otherwise. Each table update is done while holding `lock`.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> void HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::addAlCount(int istrich, int k, int sentLength,
+		int J, CLS w1, CLS w2, int j, double value, double valuePredicted) {
+	int pos=0;
+	switch (PredictionInAlignments) {
+	case 0:
+		pos=istrich-k;
+		break;
+	case 1:
+		pos=k;
+		break;
+	case 2:
+		pos=(k*J-j*sentLength);
+		if (pos>0)
+			pos+=J/2;
+		else
+			pos-=J/2;
+		pos/=J;
+		break;
+	default:
+		abort();
+	}
+
+	const AlDeps<CLS> deps(sentLength, istrich, j, w1, w2);
+
+	// MAX_SENTENCE_LENGTH is unsigned: convert before negating so the lower
+	// bound is a genuine negative int rather than a wrapped unsigned value.
+	const int bound=((CompareAlDeps&1)==0) ? static_cast<int>(MAX_SENTENCE_LENGTH)
+			: sentLength;
+
+	{
+		lock.lock();
+		typename map<AlDeps<CLS>,FlexArray<double> >::iterator p=
+				alProb.find(deps);
+		if (p==alProb.end() )
+			p=alProb.insert(make_pair(deps,FlexArray<double> (-bound,bound,0.0))).first;
+		p->second[pos]+=value;
+		lock.unlock();
+	}
+
+	if (valuePredicted) {
+		lock.lock();
+		typename map<AlDeps<CLS>,FlexArray<double> >::iterator p=
+				alProbPredicted.find(deps);
+		if (p==alProbPredicted.end() )
+			p=alProbPredicted.insert(make_pair(deps,FlexArray<double> (-bound,bound,0.0))).first;
+		p->second[pos]+=valuePredicted;
+		lock.unlock();
+	}
+}
+
+// Returns the alpha-init entry (values plus its mutex) for length I,
+// creating an all-zero array of I elements on first use. The lookup and
+// creation happen under alphalock.
+template<class CLS, class MAPPERCLASSTOSTRING> 
+pair<Array<double>,Mutex>&HMMTables<CLS,MAPPERCLASSTOSTRING>::doGetAlphaInit(int I)
+{
+	alphalock.lock();
+	const bool missing=(init_alpha.count(I)==0);
+	if( missing )
+		init_alpha[I]=pair<Array<double>,Mutex>(Array<double>(I,0),Mutex());
+	pair<Array<double>,Mutex>& entry=init_alpha[I];
+	alphalock.unlock();
+	return entry;
+}
+// Returns the beta-init entry (values plus its mutex) for length I,
+// creating an all-zero array of I elements on first use. The lookup and
+// creation happen under betalock.
+template<class CLS, class MAPPERCLASSTOSTRING> 
+pair<Array<double>,Mutex>&HMMTables<CLS,MAPPERCLASSTOSTRING>::doGetBetaInit(int I)
+{
+	betalock.lock();
+	const bool missing=(init_beta.count(I)==0);
+	if( missing )
+		init_beta[I]=pair<Array<double>,Mutex>(Array<double>(I,0),Mutex());
+	pair<Array<double>,Mutex>& entry=init_beta[I];
+	betalock.unlock();
+	return entry;
+}
+
+/**
+ * Copies the alpha-init values stored for length I into `x`.
+ * After the copy, every element past index x.size()/2 is set to zero.
+ *
+ * @return false (leaving `x` untouched) when nothing is stored for I.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> bool HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::getAlphaInit(int I, Array<double>&x) const {
+	alphalock.lock();
+	hash_map<int,pair<Array<double>,Mutex> >::const_iterator found=init_alpha.find(I);
+	const bool present=(found!=init_alpha.end());
+	if (present)
+		x=found->second.first;
+	alphalock.unlock();
+	if (!present)
+		return false;
+	// only first empty word can be chosen
+	for (unsigned int j=x.size()/2+1; j<x.size(); ++j)
+		x[j]=0;
+	return true;
+}
+/**
+ * Copies the beta-init values stored for length I into `x`.
+ *
+ * @return false (leaving `x` untouched) when nothing is stored for I.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> bool HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::getBetaInit(int I, Array<double>&x) const {
+	betalock.lock();
+	hash_map<int,pair<Array<double>,Mutex> >::const_iterator found=init_beta.find(I);
+	const bool present=(found!=init_beta.end());
+	if (present)
+		x=found->second.first;
+	betalock.unlock();
+	return present;
+}
+
+/***********************************
+ By Edward Gao
+ ************************************/
+
+// Writes one jump table as text, one distribution per line:
+//   englishSentenceLength classPrevious previous j Cj low high
+// followed by an "offset value" pair for every non-zero entry.
+// Returns false, after reporting on cerr, when the file cannot be opened.
+template<class CLS>
+static bool dumpJumpTable(const char* path,
+		const map<AlDeps<CLS>,FlexArray<double> >& table) {
+	ofstream ofs(path);
+	if (!ofs.is_open()) {
+		cerr << "Cannot open file for HMM output " << path << endl;
+		return false;
+	}
+	cerr << "Dumping HMM table to " << path << endl;
+	typedef typename map<AlDeps<CLS>,FlexArray<double> >::const_iterator RowIter;
+	for (RowIter row=table.begin(); row!=table.end(); ++row) {
+		const AlDeps<CLS>& key=row->first;
+		const FlexArray<double>& dist=row->second;
+		ofs << key.englishSentenceLength << " " << key.classPrevious << " "
+				<< key.previous << " " << key.j << " " << key.Cj << " "
+				<< dist.low() << " " << dist.high() << " ";
+		for (int a=dist.low(); a<=dist.high(); ++a) {
+			if (dist[a])
+				ofs << a << ' ' << dist[a] << ' ';
+		}
+		ofs << endl;
+	}
+	ofs.close();
+	return true;
+}
+
+// Writes one init table as text, one line per key: "key size v0 v1 ... ".
+// Returns false, after reporting on cerr, when the file cannot be opened.
+static bool dumpInitTable(const char* path,
+		const hash_map<int,pair<Array<double>,Mutex> >& table) {
+	ofstream ofs(path);
+	if (!ofs.is_open()) {
+		cerr << "Cannot open file for HMM output " << path << endl;
+		return false;
+	}
+	cerr << "Dumping HMM table to " << path << endl;
+	typedef hash_map<int,pair<Array<double>,Mutex> >::const_iterator RowIter;
+	for (RowIter row=table.begin(); row!=table.end(); row++) {
+		const Array<double>& values=row->second.first;
+		ofs << row->first << " " << values.size() << " ";
+		for (int j=0; j<values.size(); j++)
+			ofs << values[j] << " ";
+		ofs << endl;
+	}
+	ofs.close();
+	return true;
+}
+
+/**
+ * Dumps the count tables to text files so they can be rebuilt later with
+ * readJumps(). A null file name skips the corresponding table.
+ *
+ * @param alprob     destination for alProb.
+ * @param alpredict  destination for alProbPredicted.
+ * @param alpha      destination for init_alpha.
+ * @param beta       destination for init_beta.
+ * @return false as soon as one file cannot be opened (later tables are then
+ *         not written), true otherwise.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> bool HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::writeJumps(const char* alprob,
+		const char* alpredict, const char* alpha, const char* beta) const {
+	if (alprob && !dumpJumpTable(alprob, alProb))
+		return false;
+	if (alpredict && !dumpJumpTable(alpredict, alProbPredicted))
+		return false;
+	if (alpha && !dumpInitTable(alpha, init_alpha))
+		return false;
+	if (beta && !dumpInitTable(beta, init_beta))
+		return false;
+	return true;
+}
+
+// Loads one jump-table file (the format produced by writeJumps) and adds its
+// values to `table`, creating distributions that do not exist yet.
+// Returns false, after reporting on cerr, when the file cannot be opened or
+// a line does not start with the seven header fields.
+template<class CLS>
+static bool loadJumpTable(const char* path,
+		map<AlDeps<CLS>,FlexArray<double> >& table) {
+	ifstream ifs(path);
+	if (!ifs.is_open()) {
+		cerr << "Cannot open file for HMM input " << path << endl;
+		return false;
+	}
+	cerr << "Reading HMM table from " << path << endl;
+	string strLine;
+	// getline() as the loop condition also terminates on a hard read error,
+	// which a bare eof() test would spin on forever.
+	while (getline(ifs, strLine)) {
+		if (strLine.empty())
+			continue;
+		stringstream ss(strLine.c_str());
+		AlDeps<CLS> dep;
+		int low, high;
+		if (!(ss >> dep.englishSentenceLength >> dep.classPrevious
+				>> dep.previous >> dep.j >> dep.Cj >> low >> high)) {
+			// Never build a map key or a range from half-parsed fields.
+			cerr << "Malformed line in HMM table " << path << endl;
+			return false;
+		}
+		typename map<AlDeps<CLS>,FlexArray<double> >::iterator p=
+				table.find(dep);
+		if (p==table.end() ) {
+			p=table.insert(make_pair(dep,FlexArray<double> (low,high,0.0))).first;
+		}
+		int pos;
+		double val;
+		// Only complete "offset value" pairs are consumed.
+		while (ss >> pos >> val) {
+			if (pos>=low)
+				p->second[pos]+=val;
+		}
+	}
+	return true;
+}
+
+/**
+ * Reads count tables written by writeJumps() and ADDS their values to the
+ * tables of this object. A null file name skips the corresponding table.
+ *
+ * @param alprob     file added to alProb.
+ * @param alpredict  file added to alProbPredicted.
+ * @param alpha      file added to init_alpha (each line: "id size v0 v1 ...",
+ *                   id must equal size).
+ * @param beta       file added to init_beta (same layout).
+ * @return false when a file cannot be opened or is inconsistent; tables read
+ *         before the failure keep the values already added.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> bool HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::readJumps(const char* alprob,
+		const char* alpredict, const char* alpha, const char* beta) {
+	if (alprob && !loadJumpTable(alprob, alProb))
+		return false;
+	if (alpredict && !loadJumpTable(alpredict, alProbPredicted))
+		return false;
+
+	if (alpha) {
+		ifstream ifs(alpha);
+
+		if (!ifs.is_open()) {
+			cerr << "Cannot open file for HMM input " << alpha << endl;
+			return false;
+		}
+		string strLine;
+		while (getline(ifs, strLine)) {
+			if (strLine.empty())
+				continue;
+			stringstream ss(strLine.c_str());
+			int id = -1, size = -1;
+			ss >> id >> size;
+			if (id<0||size<0||id!=size) {
+				cerr << "Mismatch in alpha init table!" << endl;
+				return false;
+			}
+			pair<Array<double>, Mutex>&alp = doGetAlphaInit(id);
+			Array<double>& gk = alp.first;
+			int j;
+			double v;
+			alp.second.lock();
+			for (j=0; j<gk.size(); j++) {
+				// A short line simply contributes nothing for the
+				// remaining slots instead of adding a stale value.
+				if (!(ss >> v))
+					break;
+				gk[j]+=v;
+			}
+			alp.second.unlock();
+		}
+	}
+
+	if (beta) {
+		ifstream ifs(beta);
+
+		if (!ifs.is_open()) {
+			cerr << "Cannot open file for HMM input " << beta << endl;
+			return false;
+		}
+		string strLine;
+		while (getline(ifs, strLine)) {
+			if (strLine.empty())
+				continue;
+			stringstream ss(strLine.c_str());
+			int id = -1, size = -1;
+			ss >> id >> size;
+			if (id<0||size<0||id!=size) {
+				cerr << "Mismatch in beta init table!" << endl;
+				return false;
+			}
+			pair<Array<double>, Mutex>&bet1 = doGetBetaInit(id);
+			Array<double>&bet = bet1.first;
+
+			int j;
+			double v;
+			bet1.second.lock();
+			for (j=0; j<bet.size(); j++) {
+				if (!(ss >> v))
+					break;
+				bet[j]+=v;
+			}
+			bet1.second.unlock();
+		}
+	}
+
+	return true;
+}
+
+/**
+ * Adds every count stored in `ht` (alProb, alProbPredicted, init_alpha and
+ * init_beta) to the corresponding table of this object. Distributions and
+ * init arrays that do not exist here yet are created first.
+ *
+ * @param ht  table whose counts are added; it is only read.
+ * @return always true.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> bool HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::merge(HMMTables<CLS,MAPPERCLASSTOSTRING> & ht) {
+
+	for (typename map<AlDeps<CLS>,FlexArray<double> >::const_iterator i=
+			ht.alProb.begin(); i!=ht.alProb.end(); ++i) {
+		typename map<AlDeps<CLS>,FlexArray<double> >::iterator p=
+				alProb.find(i->first);
+		if (p==alProb.end() ) {
+			p=alProb.insert(make_pair(i->first,FlexArray<double> (i->second.low(),i->second.high(),0.0))).first;
+		}
+		for (int a=i->second.low(); a<=i->second.high(); ++a)
+			if (i->second[a]) {
+				p->second[a] += i->second[a];
+			}
+
+	}
+
+	for (typename map<AlDeps<CLS>,FlexArray<double> >::const_iterator i=
+			ht.alProbPredicted.begin(); i!=ht.alProbPredicted.end(); ++i) {
+		typename map<AlDeps<CLS>,FlexArray<double> >::iterator p=
+				alProbPredicted.find(i->first);
+		if (p==alProbPredicted.end() ) {
+			p=alProbPredicted.insert(make_pair(i->first,FlexArray<double> (i->second.low(),i->second.high(),0.0))).first;
+		}
+		for (int a=i->second.low(); a<=i->second.high(); ++a)
+			if (i->second[a]) {
+				p->second[a] += i->second[a];
+			}
+
+	}
+
+	for (typename hash_map<int,pair<Array<double>,Mutex> >::const_iterator i=
+			ht.init_alpha.begin(); i!=ht.init_alpha.end(); i++) {
+		// Must be a reference: a by-value copy would receive the merged
+		// counts and then be thrown away, leaving init_alpha unchanged.
+		pair<Array<double>,Mutex>&alp = doGetAlphaInit(i->first);
+		int j;
+		for (j=0; j<alp.first.size(); j++) {
+			alp.first[j]+=i->second.first[j];
+		}
+	}
+	for (typename hash_map<int,pair<Array<double>,Mutex> >::const_iterator i=
+			ht.init_beta.begin(); i!=ht.init_beta.end(); i++) {
+		pair<Array<double>,Mutex>&bet = doGetBetaInit(i->first);
+		int j;
+		for (j=0; j<bet.first.size(); j++) {
+			bet.first[j]+=i->second.first[j];
+		}
+	}
+
+	return true;
+
+}
+
+//////////////////////////////////////
+/**
+ * Creates empty tables.
+ *
+ * @param _probForEmpty  its absolute value becomes probabilityForEmpty; a
+ *                       negative sign sets updateProbabilityForEmpty.
+ * @param m1,m2          class-to-string mappers; only their addresses are
+ *                       stored, so they must outlive this object.
+ *
+ * The counters (globalCounter, divSum, p0_count, np0_count) start at zero so
+ * they never hold indeterminate values.
+ */
+template<class CLS, class MAPPERCLASSTOSTRING> HMMTables<CLS,
+		MAPPERCLASSTOSTRING>::HMMTables(double _probForEmpty,
+		const MAPPERCLASSTOSTRING&m1, const MAPPERCLASSTOSTRING&m2) :
+	probabilityForEmpty(mfabs(_probForEmpty)),
+			updateProbabilityForEmpty(_probForEmpty<0.0),
+			globalCounter(0), divSum(0.0), p0_count(0.0), np0_count(0.0),
+			mapper1(&m1), mapper2(&m2) {
+}
+// Nothing to release explicitly: the mappers are not owned and all tables
+// are members.
+template<class CLS, class MAPPERCLASSTOSTRING>
+HMMTables<CLS, MAPPERCLASSTOSTRING>::~HMMTables()
+{
+}
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/HMMTables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/HMMTables.h
@ -0,0 +1,179 @@
+/*
+
+Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef HMM_TABLES_H_ASDF_DEFINED
+#define HMM_TABLES_H_ASDF_DEFINED
+#include "FlexArray.h"
+
+#if __GNUC__>2
+#include <ext/hash_map>
+using __gnu_cxx::hash_map;
+#else
+#include <hash_map>
+#endif
+#include "Array.h"
+#include <map>
+#include "mymath.h"
+#include "syncObj.h"
+
+// Scales the range [a,b) so that it sums to one and returns the sum it had
+// before scaling. If that sum is zero the range is filled with the uniform
+// value 1/(b-a) instead.
+template<class T>
+T normalize_if_possible(T*a,T*b){
+    T total=0;
+    for(T*p=a;p!=b;++p)
+        total+=*p;
+    if( !total ){
+        fill(a,b,1.0/(b-a));
+        return total;
+    }
+    for(T*p=a;p!=b;++p)
+        *p/=total;
+    return total;
+}
+
+// Bit mask selecting which AlDeps fields take part in comparison:
+// 1 = englishSentenceLength, 2 = classPrevious, 4 = previous, 8 = j, 16 = Cj.
+extern short CompareAlDeps;
+
+/**
+ * Key of a jump distribution. Only the fields enabled in CompareAlDeps are
+ * looked at by operator< and operator==, so two keys that differ solely in
+ * disabled fields are equivalent.
+ */
+template<class CLS>
+class AlDeps{
+public:
+    int englishSentenceLength;
+    CLS classPrevious;
+    int previous;
+    int j;
+    CLS Cj;
+    // Zero-initialises every field so a default-constructed key is always
+    // safe to compare or print, even if a later parse fails.
+    AlDeps()
+        : englishSentenceLength(0),classPrevious(),previous(0),j(0),Cj()
+    {}
+    AlDeps(int l,int p=0,int _j=0,CLS s1=0,CLS _Cj=0)
+        : englishSentenceLength(l),classPrevious(s1),previous(p),j(_j),Cj(_Cj)
+    {}
+    // Lexicographic order over the enabled fields, in the order
+    // sentence length, previous class, previous position, j, Cj.
+    friend bool operator<(const AlDeps&x,const AlDeps&y){
+        if( (CompareAlDeps&1) && x.englishSentenceLength<y.englishSentenceLength ) return true;
+        if( (CompareAlDeps&1) && y.englishSentenceLength<x.englishSentenceLength ) return false;
+        if( (CompareAlDeps&2) && x.classPrevious<y.classPrevious ) return true;
+        if( (CompareAlDeps&2) && y.classPrevious<x.classPrevious ) return false;
+        if( (CompareAlDeps&4) && x.previous<y.previous ) return true;
+        if( (CompareAlDeps&4) && y.previous<x.previous ) return false;
+        if( (CompareAlDeps&8) && x.j<y.j ) return true;
+        if( (CompareAlDeps&8) && y.j<x.j ) return false;
+        if( (CompareAlDeps&16) && x.Cj<y.Cj ) return true;
+        if( (CompareAlDeps&16) && y.Cj<x.Cj ) return false;
+        return false;
+    }
+    // Equivalence under operator<.
+    friend bool operator==(const AlDeps&x,const AlDeps&y)
+    { return !( x<y || y<x );  }
+};
+
+// Hash functor for AlDeps keys. Only the fields enabled in CompareAlDeps
+// contribute, so keys that compare equal hash to the same value.
+template<class CLS>
+class Hash_AlDeps{
+public:
+    unsigned int operator()(const AlDeps<CLS>&x) const
+    {
+        unsigned int h=0;
+        if( CompareAlDeps&1 )  { h+=x.englishSentenceLength; h*=31; }
+        if( CompareAlDeps&2 )  { h+=x.classPrevious;         h*=31; }
+        if( CompareAlDeps&4 )  { h+=x.previous;              h*=31; }
+        if( CompareAlDeps&8 )  { h+=x.j;                     h*=31; }
+        if( CompareAlDeps&16 ) { h+=x.Cj;                    h*=31; }
+        return h;
+    }
+};
+
+/**
+ * Jump (alignment) tables of the HMM model: per-dependency distributions
+ * (alProb / alProbPredicted) plus per-length init arrays (init_alpha /
+ * init_beta), each init array paired with its own mutex.
+ */
+template<class CLS,class MAPPERCLASSTOSTRING>
+class HMMTables
+{
+    Mutex lock;        // taken around accesses to alProb / alProbPredicted
+    Mutex alphalock;   // taken around lookups in init_alpha
+    Mutex betalock;    // taken around lookups in init_beta
+public:
+    double probabilityForEmpty;
+    bool updateProbabilityForEmpty;
+    hash_map<int, pair<Array<double>,Mutex> > init_alpha;
+    hash_map<int, pair<Array<double>,Mutex> > init_beta;
+    map<AlDeps<CLS>,FlexArray<double> > alProb;
+    map<AlDeps<CLS>,FlexArray<double> > alProbPredicted;
+    int globalCounter;
+    double divSum;
+    double p0_count,np0_count;
+    const MAPPERCLASSTOSTRING*mapper1;
+    const MAPPERCLASSTOSTRING*mapper2;
+public:
+    // Adds all counts of `ht` to this table.
+    bool merge(HMMTables<CLS,MAPPERCLASSTOSTRING> & ht);
+    const HMMTables<CLS,MAPPERCLASSTOSTRING>*getThis()const
+    {
+        return this;
+    }
+    HMMTables(double _probForEmpty,const MAPPERCLASSTOSTRING&m1,const MAPPERCLASSTOSTRING&m2);
+    virtual ~HMMTables();
+    virtual double getAlProb(int i,int k,int sentLength,int J,CLS w1,CLS w2,int j,int iter=0) const;
+    virtual void writeJumps(ostream&) const;
+    /** By Edward Gao: writes everything needed to rebuild the count table. */
+    virtual bool writeJumps(const char* alprob, const char* alpredict, const char* alpha, const char* beta )const;
+    virtual bool readJumps(const char* alprob, const char* alpredict, const char* alpha, const char* beta );
+    void addAlCount(int i,int k,int sentLength,int J,CLS w1,CLS w2,int j,double value,double valuePredicted);
+    virtual void readJumps(istream&);
+    virtual bool getAlphaInit(int I,Array<double>&x)const;
+    virtual bool getBetaInit(int I,Array<double> &x)const;
+    pair<Array<double>, Mutex> &doGetAlphaInit(int I);
+    pair<Array<double>, Mutex> &doGetBetaInit(int I);
+    virtual double getProbabilityForEmpty()const
+    {
+        return probabilityForEmpty;
+    }
+
+    /**
+     * One GIS-style update: for every distribution that also has a predicted
+     * counterpart, both are normalised and each non-zero entry becomes
+     *   old * observed / predicted
+     * where `old` is the matching entry of `old->alProb` (1.0 when `old` is
+     * null or has no such distribution). A non-zero observed entry whose
+     * predicted value is not positive, and a distribution without predicted
+     * counterpart, are reported on cerr and left as they are.
+     */
+    void performGISIteration(const HMMTables<CLS,MAPPERCLASSTOSTRING>*old){
+        typedef map<AlDeps<CLS>,FlexArray<double> > JumpTable;
+        cout << "OLDSIZE: " << (old?(old->alProb.size()):0) << " NEWSIZE:"<< alProb.size()<< endl;
+        for(typename JumpTable::iterator obs=alProb.begin();obs!=alProb.end();++obs){
+            typename JumpTable::iterator pred=alProbPredicted.find(obs->first);
+            if( pred==alProbPredicted.end() ){
+                cerr << "ERROR in performGISIteration: " << alProbPredicted.count(obs->first) << endl;
+                continue;
+            }
+            normalize_if_possible(obs->second.begin(),obs->second.end());
+            normalize_if_possible(pred->second.begin(),pred->second.end());
+            for(int j=obs->second.low();j<=obs->second.high();++j){
+                if( !obs->second[j] )
+                    continue;
+                if( pred->second[j]>0.0 ){
+                    double op=1.0;
+                    if( old ){
+                        typename JumpTable::const_iterator prev=old->alProb.find(obs->first);
+                        if( prev!=old->alProb.end() )
+                            op=(prev->second)[j];
+                    }
+                    obs->second[j]= op*(obs->second[j]/pred->second[j]);
+                }
+                else{
+                    cerr << "ERROR2 in performGISiteration: " << obs->second[j] << endl;
+                }
+            }
+        }
+    }
+};
+
+// Prints the fields of `x` that are enabled in CompareAlDeps, each as
+// "label: value " on a single line; classes are rendered through the
+// mappers' classString().
+template<class CLS,class MAPPERCLASSTOSTRING>
+inline void printAlDeps(ostream&out,const AlDeps<CLS>&x,const MAPPERCLASSTOSTRING&mapper1,const MAPPERCLASSTOSTRING&mapper2)
+{
+  const int mask=CompareAlDeps;
+  if( mask&1 )
+    out << "sentenceLength: " << x.englishSentenceLength<< ' ';
+  if( mask&2 )
+    out << "previousClass: " << mapper1.classString(x.classPrevious) << ' ';
+  if( mask&4 )
+    out << "previousPosition: " << x.previous << ' ';
+  if( mask&8 )
+    out << "FrenchPosition: " << x.j << ' ';
+  if( mask&16 )
+    out << "FrenchClass: " << mapper2.classString(x.Cj) << ' ';
+}
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Makefile.am
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Makefile.am
@ -0,0 +1,217 @@
+## Process this file with automake to produce Makefile.in
+
+## Created by Anjuta
+
+INCLUDES = \
+	-DPACKAGE_LOCALE_DIR=\""$(prefix)/$(DATADIRNAME)/locale"\" \
+	-DPACKAGE_SRC_DIR=\""$(srcdir)"\" \
+	-DPACKAGE_DATA_DIR=\""$(datadir)"\" 
+
+AM_CFLAGS =\
+	 -Wall\
+	 -g
+
+bin_PROGRAMS = mgiza \
+	snt2cooc\
+	snt2plain\
+	plain2snt \
+	symal \
+	hmmnorm \
+	d4norm
+
+d4norm_SOURCES = \
+	d4norm.cxx
+
+d4norm_LDADD = \
+	-lgiza \
+	-lpthread
+
+d4norm_LDFLAGS = \
+	-L.
+
+d4norm_DEPENDENCIES = \
+	libgiza.a
+
+# Optimisation level only. automake appends its own dependency-tracking
+# flags with proper arguments; listing bare -MT/-MF here made them swallow
+# the following flag (including the optimisation level) as their argument.
+d4norm_CXXFLAGS = \
+	-O3
+
+d4norm_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+hmmnorm_SOURCES = \
+	hmmnorm.cxx
+
+hmmnorm_LDADD = \
+	-lgiza \
+	-lpthread
+
+hmmnorm_LDFLAGS = \
+	-L.
+
+hmmnorm_DEPENDENCIES = \
+	libgiza.a
+
+# Optimisation level only. automake appends its own dependency-tracking
+# flags with proper arguments; listing bare -MT/-MF here made them swallow
+# the following flag (including the optimisation level) as their argument.
+hmmnorm_CXXFLAGS = \
+	-O3
+
+hmmnorm_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+symal_SOURCES = \
+	cmd.c  \
+	cmd.h  \
+	symal.cpp
+
+plain2snt_SOURCES = \
+	plain2snt.cpp
+
+snt2plain_SOURCES = \
+	snt2plain.cpp
+
+snt2cooc_SOURCES = \
+	snt2cooc.cpp
+
+snt2cooc_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+mgiza_SOURCES = \
+	main.cpp
+
+mgiza_DEPENDENCIES = \
+	libgiza.a
+
+# Optimisation level only. automake appends its own dependency-tracking
+# flags with proper arguments; listing bare -MT/-MF here made them swallow
+# the following flag (including the optimisation level) as their argument.
+mgiza_CXXFLAGS = \
+	-O3
+
+mgiza_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+mgiza_LDFLAGS = \
+	-L.
+
+mgiza_LDADD = \
+	-lgiza \
+	-lpthread
+
+lib_LIBRARIES = \
+	libgiza.a
+
+libgiza_a_SOURCES = \
+	alignment.cpp\
+	alignment.h \
+	AlignTables.cpp \
+	AlignTables.h \
+	Array.h \
+	Array2.h \
+	Array4.h \
+	ATables.cpp \
+	ATables.h \
+	collCounts.cpp \
+	collCounts.h \
+	common.h \
+	D4Tables.h \
+	D5Tables.h \
+	defs.h \
+	Dictionary.cpp \
+	Dictionary.h \
+	file_spec.h \
+	FlexArray.h \
+	ForwardBackward.cpp \
+	ForwardBackward.h \
+	getSentence.cpp \
+	getSentence.h \
+	Globals.h \
+	hmm.cpp \
+	hmm.h \
+	HMMTables.cpp \
+	HMMTables.h \
+	logprob.cpp \
+	logprob.h \
+	model1.cpp \
+	model1.h \
+	model2.cpp \
+	model2.h \
+	model2to3.cpp \
+	model3.cpp \
+	model3.h \
+	model3_viterbi.cpp \
+	model3_viterbi_with_tricks.cpp \
+	model345-peg.cpp \
+	MoveSwapMatrix.cpp \
+	MoveSwapMatrix.h \
+	myassert.cpp \
+	myassert.h \
+	mymath.h \
+	mystl.h \
+	NTables.cpp \
+	NTables.h \
+	Parameter.cpp \
+	Parameter.h \
+	parse.cpp \
+	Perplexity.cpp \
+	Perplexity.h \
+	Pointer.h \
+	reports.cpp \
+	SetArray.cpp \
+	SetArray.h \
+	syncObj.h \
+	transpair_model1.h \
+	transpair_model2.h \
+	transpair_model3.cpp \
+	transpair_model3.h \
+	transpair_model4.cpp \
+	transpair_model4.h \
+	transpair_model5.cpp \
+	transpair_model5.h \
+	transpair_modelhmm.h \
+	ttableDiff.hpp \
+	TTables.cpp \
+	TTables.h \
+	types.h \
+	utility.cpp \
+	utility.h \
+	Vector.h \
+	vocab.cpp \
+	vocab.h \
+	WordClasses.h
+
+# Optimisation level only. automake appends its own dependency-tracking
+# flags with proper arguments; the bare -MF listed here took "-MT" as the
+# name of its dependency file.
+libgiza_a_CXXFLAGS = \
+	-O3
+
+libgiza_a_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+SUBDIRS = \
+	mkcls
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Makefile.am.bak
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Makefile.am.bak
@ -0,0 +1,214 @@
+## Process this file with automake to produce Makefile.in
+
+## Created by Anjuta
+
+INCLUDES = \
+	-DPACKAGE_LOCALE_DIR=\""$(prefix)/$(DATADIRNAME)/locale"\" \
+	-DPACKAGE_SRC_DIR=\""$(srcdir)"\" \
+	-DPACKAGE_DATA_DIR=\""$(datadir)"\" 
+
+AM_CFLAGS =\
+	 -Wall\
+	 -g
+
+bin_PROGRAMS = mgiza \
+	snt2cooc\
+	snt2plain\
+	plain2snt \
+	symal \
+	hmmnorm \
+	d4norm
+
+d4norm_SOURCES = \
+	d4norm.cxx
+
+d4norm_LDADD = \
+	-lgiza \
+	-lpthread
+
+d4norm_LDFLAGS = \
+	-L.
+
+d4norm_DEPENDENCIES = \
+	libgiza.a
+
+# Automake generates its own -MT/-MD/-MP/-MF dependency-tracking options.
+# Listing them here without arguments made the compiler treat the following
+# word as the argument ("-MT -MD", "-MF -O6"), so the optimisation level was
+# silently swallowed. Only the optimisation flag is kept.
+d4norm_CXXFLAGS = \
+	-O3
+
+d4norm_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+hmmnorm_SOURCES = \
+	hmmnorm.cxx
+
+hmmnorm_LDADD = \
+	-lgiza \
+	-lpthread
+
+hmmnorm_LDFLAGS = \
+	-L.
+
+hmmnorm_DEPENDENCIES = \
+	libgiza.a
+
+# Automake generates its own -MT/-MD/-MP/-MF dependency-tracking options.
+# Listing them here without arguments made the compiler treat the following
+# word as the argument ("-MT -MD", "-MF -O6"), so the optimisation level was
+# silently swallowed. Only the optimisation flag is kept.
+hmmnorm_CXXFLAGS = \
+	-O3
+
+hmmnorm_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+symal_SOURCES = \
+	cmd.c  \
+	cmd.h  \
+	symal.cpp
+
+plain2snt_SOURCES = \
+	plain2snt.cpp
+
+snt2plain_SOURCES = \
+	snt2plain.cpp
+
+snt2cooc_SOURCES = \
+	snt2cooc.cpp
+
+snt2cooc_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+mgiza_SOURCES = \
+	main.cpp
+
+mgiza_DEPENDENCIES = \
+	libgiza.a
+
+# Automake generates its own -MT/-MD/-MP/-MF dependency-tracking options.
+# Listing them here without arguments made the compiler treat the following
+# word as the argument ("-MT -MD", "-MF -O6"), so the optimisation level was
+# silently swallowed. Only the optimisation flag is kept.
+mgiza_CXXFLAGS = \
+	-O3
+
+mgiza_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
+mgiza_LDFLAGS = \
+	-L.
+
+mgiza_LDADD = \
+	-lgiza \
+	-lpthread
+
+lib_LIBRARIES = \
+	libgiza.a
+
+libgiza_a_SOURCES = \
+	alignment.cpp\
+	alignment.h \
+	AlignTables.cpp \
+	AlignTables.h \
+	Array.h \
+	Array2.h \
+	Array4.h \
+	ATables.cpp \
+	ATables.h \
+	collCounts.cpp \
+	collCounts.h \
+	common.h \
+	D4Tables.h \
+	D5Tables.h \
+	defs.h \
+	Dictionary.cpp \
+	Dictionary.h \
+	file_spec.h \
+	FlexArray.h \
+	ForwardBackward.cpp \
+	ForwardBackward.h \
+	getSentence.cpp \
+	getSentence.h \
+	Globals.h \
+	hmm.cpp \
+	hmm.h \
+	HMMTables.cpp \
+	HMMTables.h \
+	logprob.cpp \
+	logprob.h \
+	model1.cpp \
+	model1.h \
+	model2.cpp \
+	model2.h \
+	model2to3.cpp \
+	model3.cpp \
+	model3.h \
+	model3_viterbi.cpp \
+	model3_viterbi_with_tricks.cpp \
+	model345-peg.cpp \
+	MoveSwapMatrix.cpp \
+	MoveSwapMatrix.h \
+	myassert.cpp \
+	myassert.h \
+	mymath.h \
+	mystl.h \
+	NTables.cpp \
+	NTables.h \
+	Parameter.cpp \
+	Parameter.h \
+	parse.cpp \
+	Perplexity.cpp \
+	Perplexity.h \
+	Pointer.h \
+	reports.cpp \
+	SetArray.cpp \
+	SetArray.h \
+	syncObj.h \
+	transpair_model1.h \
+	transpair_model2.h \
+	transpair_model3.cpp \
+	transpair_model3.h \
+	transpair_model4.cpp \
+	transpair_model4.h \
+	transpair_model5.cpp \
+	transpair_model5.h \
+	transpair_modelhmm.h \
+	ttableDiff.hpp \
+	TTables.cpp \
+	TTables.h \
+	types.h \
+	utility.cpp \
+	utility.h \
+	Vector.h \
+	vocab.cpp \
+	vocab.h \
+	WordClasses.h
+
+# Automake generates its own -MT/-MD/-MP/-MF dependency-tracking options.
+# The bare "-MF" listed here consumed the following "-MT" as its file name;
+# none of those options belong in the per-target flags. -O3 is the portable
+# spelling of the level gcc applies for "-O6".
+libgiza_a_CXXFLAGS = \
+	-O3
+
+libgiza_a_CPPFLAGS = \
+	-DNDEBUG \
+	-DWORDINDEX_WITH_4_BYTE \
+	-DBINARY_SEARCH_FOR_TTABLE \
+	-DDEBUG
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Makefile.in
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Makefile.in
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/MoveSwapMatrix.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/MoveSwapMatrix.cpp
@ -0,0 +1,235 @@
+/*
+
+Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#include "MoveSwapMatrix.h"
+
+// Builds the move/swap score cache for alignment _a under the model _ef.
+// The alignment is copied into the base class, _ef is kept by reference,
+// and (unless lazy evaluation is on) every column 1..m is scored up front.
+template<class TRANSPAIR>
+MoveSwapMatrix<TRANSPAIR>::MoveSwapMatrix(const TRANSPAIR&_ef, const alignment&_a)
+  : alignment(_a),
+    ef(_ef),
+    l(ef.get_l()),
+    m(ef.get_m()),
+    _cmove(l+1, m+1),
+    _cswap(m+1, m+1),
+    delmove(l+1, m+1,0),
+    delswap(m+1, m+1,0),
+    changed(l+2, 0),
+    changedCounter(1),
+    modelnr(_ef.modelnr()),
+    lazyEvaluation(0),
+    centerDeleted(0)
+{
+  // The baseline score is requested unconditionally, before the lazy check.
+  double baseScore=ef.scoreOfAlignmentForChange((*this));
+  if( !lazyEvaluation )
+    {
+      for(WordIndex col=1; col<=m; col++)
+        updateJ(col, 0, baseScore);
+    }
+}
+
+// Recomputes every cached score that involves target position j:
+//   - the move scores _cmove(i, j) for all rows i in 0..l, and
+//   - the swap scores between j and every other position in 1..m.
+// When useChanged is set, rows already stamped with the current
+// changedCounter are skipped. Entries for an identical alignment point
+// (no real move / no real swap) are set to the neutral score 1.0.
+template<class TRANSPAIR>
+void MoveSwapMatrix<TRANSPAIR>::updateJ(WordIndex j, bool useChanged,double thisValue)
+{
+  massert( lazyEvaluation==0 );
+
+  // Move scores for column j.
+  for(WordIndex row=0; row<=l; row++)
+    {
+      if( useChanged!=0 && changed[row]==changedCounter )
+        continue;
+      if( get_al(j)==row )
+        _cmove(row, j)=1.0;
+      else
+        _cmove(row, j)=ef.scoreOfMove((*this), row, j,thisValue);
+    }
+
+  // Swap scores with positions to the right of j.
+  for(WordIndex right=j+1; right<=m; right++)
+    {
+      if( get_al(j)==get_al(right) )
+        _cswap(j, right)=1.0;
+      else
+        _cswap(j, right)=ef.scoreOfSwap((*this), j, right,thisValue);
+    }
+
+  // Swap scores with positions to the left of j (stored as (left, j)).
+  for(WordIndex left=1; left<j; left++)
+    {
+      if( get_al(j)==get_al(left) )
+        _cswap(left, j)=1.0;
+      else
+        _cswap(left, j)=ef.scoreOfSwap((*this), left, j,thisValue);
+    }
+}
+// Recomputes the cached move scores _cmove(i, j) of row i for every target
+// position j in 1..m. A position already aligned to i gets the neutral
+// score 1.0.
+template<class TRANSPAIR>
+void MoveSwapMatrix<TRANSPAIR>::updateI(WordIndex i,double thisValue)
+{
+  massert( lazyEvaluation==0);
+  for(WordIndex col=1; col<=m; col++)
+    {
+      if( get_al(col)==i )
+        _cmove(i, col)=1.0;
+      else
+        _cmove(i, col)=ef.scoreOfMove((*this), i, col,thisValue);
+    }
+}
+
+// Debug dump comparing cached scores with freshly computed ones, written to
+// cout. First an (l+1) x m grid for moves:
+//   'A' aligned pair, 'b' relative error > 1e-3, 'e' relative error > 1e-10,
+//   'E' values differ at all, ' ' exact match.
+// Then an m x m upper-triangular grid for swaps ('A' same alignment,
+// otherwise the result of the equality test). Always ends in massert(0).
+template<class TRANSPAIR>
+void MoveSwapMatrix<TRANSPAIR>::printWrongs()const{
+  for(WordIndex row=0; row<=l; row++)
+    {
+      for(WordIndex col=1; col<=m; col++)
+        {
+          if( get_al(col)==row )
+            {
+              cout << "A";
+              continue;
+            }
+          LogProb real=_cmove(row, col), wanted=ef.scoreOfMove((*this), row, col);
+          char mark=' ';
+          if( fabs(1.0-real/wanted)>1e-3 )
+            mark='b';
+          else if(fabs(1.0-real/wanted)>1e-10 )
+            mark='e';
+          else if(real!=wanted)
+            mark='E';
+          cout << mark;
+        }
+      cout << endl;
+    }
+  cout << endl;
+  for(WordIndex first=1; first<=m; first++)
+    {
+      for(WordIndex second=1; second<=m; second++)
+        {
+          if( !(second>first) )
+            cout << ' ';
+          else if( get_al(first)==get_al(second) )
+            cout << 'A';
+          else
+            cout << (_cswap(first, second)==ef.scoreOfSwap((*this), first, second));
+        }
+      cout << endl;  
+    }
+  massert(0);
+}
+// Consistency check: verifies that every cached move and swap score equals
+// (per doubleEqual) the score recomputed from the model. Reports the first
+// mismatch on cerr and returns false; returns true when everything matches
+// or when lazy evaluation is on (nothing is cached in that mode).
+template<class TRANSPAIR>
+bool MoveSwapMatrix<TRANSPAIR>::isRight()const{
+  if( lazyEvaluation ) 
+    return 1;
+
+  for(WordIndex row=0; row<=l; row++)
+    {
+      for(WordIndex col=1; col<=m; col++)
+        {
+          if( get_al(col)==row )
+            continue;
+          if( doubleEqual(_cmove(row, col), ef.scoreOfMove((*this), row, col)) )
+            continue;
+          cerr << "DIFF: " << row << " " << col << " " << _cmove(row, col) << " " << ef.scoreOfMove((*this), row, col) << endl;
+          return 0;
+        }
+    }
+
+  for(WordIndex first=1; first<=m; first++)
+    {
+      for(WordIndex second=1; second<=m; second++)
+        {
+          if( !(second>first) )
+            continue;
+          if( get_al(first)==get_al(second) )
+            continue;
+          if( doubleEqual(_cswap(first, second), ef.scoreOfSwap((*this), first, second)) )
+            continue;
+          cerr << "DIFFERENT: " << first << " " << second << " " << _cswap(first, second) << " " << ef.scoreOfSwap((*this), first, second) << endl;
+          return 0;
+        }
+    }
+  return 1;
+}
+
+// Applies a move: target position _j is re-linked to source position _i via
+// set(_j, _i), and the cached scores affected by the change are refreshed.
+// How much is refreshed depends on modelnr:
+//   5/6 : every column is recomputed;
+//   4   : rows in the prev_cept..next_cept ranges around the old and new
+//         source positions, plus every column aligned into those rows;
+//   else: (asserted to be model 3) only the two rows old_i and _i and the
+//         columns aligned to either of them.
+// In lazy mode only the alignment itself is updated.
+template<class TRANSPAIR>
+void MoveSwapMatrix<TRANSPAIR>::doMove(WordIndex _i, WordIndex _j)
+{
+  WordIndex old_i=get_al(_j);
+  // NOTE(review): hard-coded bound of 100; presumably tied to the maximum
+  // sentence length -- confirm. The move is dropped with a message on cerr.
+  if(old_i>100){
+	  cerr << "Error, invalid index set";
+	  return;
+  }
+  if( lazyEvaluation )
+    set(_j,_i);
+  else
+    {
+      if ( modelnr==5||modelnr==6 )
+	{
+	  set(_j, _i);
+	  double thisValue=ef.scoreOfAlignmentForChange((*this));
+	  for(WordIndex j=1;j<=m;j++)updateJ(j, 0,thisValue);
+	}
+      else if ( modelnr==4 )
+	{
+	  changedCounter++;
+	  // Stamp the affected rows both before and after the link changes;
+	  // presumably prev_cept/next_cept give different ranges once set()
+	  // has been applied -- verify against alignment.
+	  for(unsigned int k=prev_cept(old_i);k<=next_cept(old_i);++k)changed[k]=changedCounter;
+	  for(unsigned int k=prev_cept(_i);k<=next_cept(_i);++k)changed[k]=changedCounter;
+	  set(_j, _i);
+	  for(unsigned int k=prev_cept(old_i);k<=next_cept(old_i);++k)changed[k]=changedCounter;
+	  for(unsigned int k=prev_cept(_i);k<=next_cept(_i);++k)changed[k]=changedCounter;
+	  double thisValue=ef.scoreOfAlignmentForChange((*this));
+	  // Refresh every stamped row completely ...
+	  for(unsigned int i=0;i<=l;i++)
+	    if(changed[i]==changedCounter)
+	      updateI(i,thisValue);
+	  // ... and, for columns aligned into a stamped row, the remaining
+	  // (unstamped) rows plus their swap scores.
+	  for(unsigned int j=1;j<=m;j++)
+	    if( changed[get_al(j)]==changedCounter )
+	      updateJ(j, 1,thisValue);
+	}
+      else
+	{
+	  assert(modelnr==3);
+	  set(_j, _i);
+	  changedCounter++;
+	  double thisValue=ef.scoreOfAlignmentForChange((*this));
+	  // Rows are stamped after being refreshed so that updateJ(.., 1, ..)
+	  // below does not recompute them a second time.
+	  updateI(old_i,thisValue);
+	  changed[old_i]=changedCounter;
+	  updateI(_i,thisValue);
+	  changed[_i]=changedCounter;
+	  for(WordIndex j=1;j<=m;j++)
+	    if( get_al(j)==_i || get_al(j)==old_i )
+	      updateJ(j, 1,thisValue);
+	}
+    }
+}
+// Applies a swap: the source positions linked to target positions _j1 and
+// _j2 are exchanged, and the cached scores affected by the change are
+// refreshed. The refresh strategy mirrors doMove:
+//   5/6 : every column is recomputed;
+//   4   : rows in the prev_cept..next_cept ranges around both source
+//         positions (taken before the swap), plus columns aligned into them;
+//   else: (asserted to be model 3) the two rows i1, i2 and the two columns.
+// In lazy mode only the alignment itself is updated.
+template<class TRANSPAIR>
+void MoveSwapMatrix<TRANSPAIR>::doSwap(WordIndex _j1, WordIndex _j2)
+{
+  // Only swaps with a score above 1 are expected here (checked via assert).
+  assert( cswap(_j1, _j2)>1 );
+  WordIndex i1=get_al(_j1), i2=get_al(_j2);
+  if( lazyEvaluation==1 )
+    {
+      set(_j1, i2);
+      set(_j2, i1);
+    }
+  else
+    {
+      if ( modelnr==5||modelnr==6 )
+	{
+	  set(_j1, i2);
+	  set(_j2, i1);
+	  double thisValue=ef.scoreOfAlignmentForChange((*this));
+	  for(WordIndex j=1;j<=m;j++)updateJ(j, 0,thisValue);
+	}
+      else if( modelnr==4 )
+	{
+	  changedCounter++;
+	  // Stamp the rows around both source positions before the links are
+	  // exchanged (unlike doMove, the ranges are not stamped again after).
+	  for(unsigned int k=prev_cept(i1);k<=next_cept(i1);++k)changed[k]=changedCounter;
+	  for(unsigned int k=prev_cept(i2);k<=next_cept(i2);++k)changed[k]=changedCounter;
+	  set(_j1, i2);
+	  set(_j2, i1);
+	  double thisValue=ef.scoreOfAlignmentForChange((*this));
+	  for(unsigned int i=0;i<=l;i++)
+	    if(changed[i]==changedCounter)
+	      updateI(i,thisValue);
+	  for(unsigned int j=1;j<=m;j++)
+	    if( changed[get_al(j)]==changedCounter )
+	      updateJ(j, 1,thisValue);
+	}
+      else
+	{
+	  assert(modelnr==3);
+	  set(_j1, i2);
+	  set(_j2, i1);
+	  changedCounter++;
+	  double thisValue=ef.scoreOfAlignmentForChange((*this));
+	  // Rows are stamped after being refreshed so that updateJ(.., 1, ..)
+	  // below skips them.
+	  updateI(i1,thisValue);
+	  changed[i1]=changedCounter;
+	  updateI(i2,thisValue);
+	  changed[i2]=changedCounter;
+	  updateJ(_j1, 1,thisValue);
+	  updateJ(_j2, 1,thisValue);
+	}
+    }
+}
+
+// The member templates above are defined in this .cpp file, so the class is
+// explicitly instantiated here for each translation-pair model it is used
+// with; the model headers are pulled in just for that purpose.
+#include "transpair_model3.h"
+#include "transpair_model4.h"
+#include "transpair_model5.h"
+#include "transpair_modelhmm.h"
+template class MoveSwapMatrix<transpair_model3>;
+template class MoveSwapMatrix<transpair_model4>;
+template class MoveSwapMatrix<transpair_model5>;
+template class MoveSwapMatrix<transpair_modelhmm>;
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/MoveSwapMatrix.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/MoveSwapMatrix.h
@ -0,0 +1,162 @@
+/*
+
+ EGYPT Toolkit for Statistical Machine Translation
+ Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful,
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307,
+ USA.
+
+ */
+/*--
+ MoveSwapMatrix: Efficient representation for moving and swapping
+ around in IBM3 training.
+ Franz Josef Och (30/07/99)
+ --*/
+#ifndef moveswap2_costs_h_defined
+#define moveswap2_costs_h_defined
+#include "alignment.h"
+#include "transpair_model3.h"
+#include "myassert.h"
+#include <set>
+#include <map>
+#include <vector>
+
+extern short DoViterbiTraining;
+
+/**
+ * An alignment together with cached scores for every single "move"
+ * (re-linking target position j to source position i) and "swap"
+ * (exchanging the links of two target positions).
+ *
+ * On top of the cache the class keeps two optional whitelists that restrict
+ * which links may be proposed; a forbidden move/swap is reported with the
+ * score -1. The whitelists are only consulted when lazy evaluation is off.
+ */
+template<class TRANSPAIR>
+class MoveSwapMatrix: public alignment {
+private:
+	const TRANSPAIR&ef;
+	const WordIndex l, m;
+	Array2<LogProb, Vector<LogProb> > _cmove, _cswap;
+	Array2<char, Vector<char> > delmove, delswap;
+	Vector<int> changed;
+	int changedCounter;
+	const int modelnr;
+	bool lazyEvaluation;
+	bool centerDeleted;
+	// Whitelists: when source position i has an entry in untouch_i, only the
+	// target positions in that set may be moved onto i; when target position
+	// j has an entry in untouch_j, j may only be linked to the source
+	// positions in that set. Positions without an entry are unrestricted.
+	std::map<int,std::set<int> > untouch_i;
+	std::map<int,std::set<int> > untouch_j;
+public:
+	/// Allow target position j for source position i (ignored for i<=0).
+	void addUnTouchI(int i, int j){
+		if(i>0){
+			// operator[] creates the empty set on first use.
+			untouch_i[i].insert(j);
+		}
+	}
+
+	/// Allow source position i for target position j (ignored for j<=0).
+	void addUnTouchJ(int j,int i){
+		if(j>0){
+			untouch_j[j].insert(i);
+		}
+	}
+
+	bool check() const {
+		return 1;
+	}
+	const TRANSPAIR&get_ef() const {
+		return ef;
+	}
+	bool isCenterDeleted() const {
+		return centerDeleted;
+	}
+	bool isLazy() const {
+		return lazyEvaluation;
+	}
+	MoveSwapMatrix(const TRANSPAIR&_ef, const alignment&_a);
+	void updateJ(WordIndex j, bool, double thisValue);
+	void updateI(WordIndex i, double thisValue);
+	void doMove(WordIndex _i, WordIndex _j);
+	void doSwap(WordIndex _j1, WordIndex _j2);
+	void delCenter() {
+		centerDeleted = 1;
+	}
+	void delMove(WordIndex x, WordIndex y) {
+		delmove(x, y) = 1;
+	}
+	/// Marks the swap of x and y (x<y) as deleted, in both orientations.
+	void delSwap(WordIndex x, WordIndex y) {
+		massert(y>x);
+		delswap(x, y) = 1;
+		delswap(y, x) = 1;
+	}
+	bool isDelMove(WordIndex x, WordIndex y) const {
+		return DoViterbiTraining || delmove(x, y);
+	}
+	bool isDelSwap(WordIndex x, WordIndex y) const {
+		massert(y>x);
+		return DoViterbiTraining || delswap(x, y);
+	}
+	/**
+	 * Score of moving target position y onto source position x.
+	 * In lazy mode the score is computed on demand; otherwise the cached
+	 * value is returned, or -1 when a whitelist forbids the link.
+	 */
+	LogProb cmove(WordIndex x, WordIndex y) const {
+		massert( get_al(y)!=x );
+		massert( delmove(x,y)==0 );
+		if (lazyEvaluation)
+			return ef.scoreOfMove(*this, x, y);
+		else {
+			std::map<int, std::set<int> >::const_iterator it;
+
+			it = untouch_i.find(x);
+			if(it!=untouch_i.end()){
+				// x is restricted and y is not in its feasible set.
+				if(it->second.find(y) == it->second.end())
+					return -1;
+			}
+			it = untouch_j.find(y);
+			if(it!=untouch_j.end()){
+				// y is restricted and x is not in its feasible set.
+				if(it->second.find(x) == it->second.end())
+					return -1;
+			}
+			return _cmove(x, y);
+		}
+	}
+	/**
+	 * Score of swapping the links of target positions x and y (x<y).
+	 * In lazy mode the score is computed on demand; otherwise the cached
+	 * value is returned, or -1 when either position is restricted and the
+	 * link it would receive is not in its feasible set.
+	 */
+	LogProb cswap(WordIndex x, WordIndex y) const {
+		massert(x<y);
+		massert(delswap(x,y)==0);
+		massert(get_al(x)!=get_al(y));
+		if (lazyEvaluation)
+			return ef.scoreOfSwap(*this, x, y);
+		else {
+			massert(y>x);
+			std::map<int, std::set<int> >::const_iterator it1,it2;
+			it1 =untouch_j.find(y);
+			it2 = untouch_j.find(x);
+			int nal1 = get_al(y);
+			int nal2 = get_al(x); // after the swap y is linked to nal2 and
+			                      // x to nal1, so each must be feasible
+			                      // for the other position
+
+			if(it1!=untouch_j.end()&&it1->second.find(nal2)==it1->second.end()){
+				return -1;
+			}
+			if(it2!=untouch_j.end()&&it2->second.find(nal1)==it2->second.end()){
+				return -1;
+			}
+			return _cswap(x, y);
+		}
+	}
+	void printWrongs() const;
+	bool isRight() const;
+	/// Dumps the alignment, the model and both score matrices.
+	friend ostream&operator<<(ostream&out, const MoveSwapMatrix<TRANSPAIR>&m) {
+		// Print the base-class part through a reference instead of a sliced copy.
+		return out << static_cast<const alignment&>(m) << "\nEF:\n" << m.ef << "\nCMOVE\n"
+				<< m._cmove << "\nCSWAP\n" << m._cswap << endl;
+	}
+};
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/NTables.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/NTables.cpp
@ -0,0 +1,184 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#include "NTables.h"
+#include <iostream>
+#include "defs.h"
+#include <fstream>
+#include "Parameter.h"
+
+GLOBAL_PARAMETER(double,NTablesFactorGraphemes,"nSmooth","smoothing for fertility parameters (good value: 64): weight for wordlength-dependent fertility parameters",PARLEV_SMOOTH,64.0);
+GLOBAL_PARAMETER(double,NTablesFactorGeneral,"nSmoothGeneral","smoothing for fertility parameters (default: 0): weight for word-independent fertility parameters",PARLEV_SMOOTH,0.0);
+
+// Writes the fertility table to `filename`, one line per source word with a
+// positive frequency: the word (when `actual` is set) or its id, followed by
+// MAX_FERTILITY probabilities. Values not above PROB_SMOOTH are written as 0.
+template <class VALTYPE>
+void nmodel<VALTYPE>::printNTable(int noEW, const char* filename, 
+				  const Vector<WordEntry>& evlist, 
+				  bool actual) const
+{
+    cerr << "Dumping nTable to: " << filename <<  '\n';  
+    ofstream of(filename);
+    for(WordIndex word=1; int(word) < noEW; word++){
+        if (!(evlist[word].freq > 0))
+            continue;
+        if (actual)
+            of << evlist[word].word << ' ' ;
+        else 
+            of << word << ' ' ;
+        for(WordIndex fert=0; fert < MAX_FERTILITY; fert++){
+            VALTYPE p = getValue(word, fert);
+            if (p <= PROB_SMOOTH) 
+                p = 0;
+            of << p << ' ';      
+        }
+        of << '\n';
+    }
+}
+
+// Writes the fertility table to `filename`, one line per source word with a
+// positive frequency: the word (when `actual` is set) or its id, followed by
+// MAX_FERTILITY values exactly as getValue() returns them (no values are
+// replaced by 0 here).
+template <class VALTYPE>
+void nmodel<VALTYPE>::printRealNTable(int noEW, const char* filename, 
+				  const Vector<WordEntry>& evlist, 
+				  bool actual) const
+{
+    cerr << "Dumping nTable to: " << filename <<  '\n';  
+    ofstream of(filename);
+    for(WordIndex word=1; int(word) < noEW; word++){
+        if (!(evlist[word].freq > 0))
+            continue;
+        if (actual)
+            of << evlist[word].word << ' ' ;
+        else 
+            of << word << ' ' ;
+        for(WordIndex fert=0; fert < MAX_FERTILITY; fert++){
+            VALTYPE p = getValue(word, fert);
+            of << p << ' ';      
+        }
+        of << '\n';
+    }
+}
+
+template <class VALTYPE>
+bool nmodel<VALTYPE>::readNTable(const char *filename){
+  /* Reads the n (fertility) table from a file, replacing the stored values.
+     Each line has the format:  source_word_id p0 p1 p2 ... pn
+     with MAX_FERTILITY probabilities per entry.
+     Returns false when the file cannot be opened, true otherwise.
+     Reading stops at end of file or at the first token that is not a
+     number; an entry that ends prematurely is reported on cerr and the
+     values read so far for it are kept.
+     The process exits when a token id exceeds MAX_VOCAB_SIZE.
+  */
+    ifstream inf(filename);
+    if(!inf.is_open()){
+        return false;
+    }
+    cerr << "Reading fertility table from " << filename << "\n";
+    
+    WordIndex tok;
+    int nFert=0;
+    bool truncated=false;
+    // Test the extraction itself rather than eof(): a trailing newline would
+    // otherwise trigger one more pass that rewrites the last row with stale
+    // values, and a non-numeric token would make the loop spin forever.
+    while(!truncated && (inf >> tok)){
+        if (tok > MAX_VOCAB_SIZE){
+            cerr << "NTables:readNTable(): unrecognized token id: " << tok
+                <<'\n';
+            exit(-1);
+        }
+        for(WordIndex i = 0; i < MAX_FERTILITY; i++){
+            VALTYPE prob;
+            if(!(inf >> prob)){
+                cerr << "NTables:readNTable(): incomplete entry for token id: "
+                    << tok <<'\n';
+                truncated=true;
+                break;
+            }
+            getRef(tok, i)=prob;
+        }
+        if(!truncated)
+            nFert++;
+    }
+    cerr << "Read " << nFert << " entries in fertility table.\n";
+    inf.close();
+    return true;
+}
+
+template <class VALTYPE>
+bool nmodel<VALTYPE>::merge(nmodel<VALTYPE>& n,int noEW, const Vector<WordEntry>& evlist){
+  /* Adds the values of table n to this table, entry by entry.
+     Only source words 1..noEW-1 with a positive frequency in evlist are
+     merged; for each of them the MAX_FERTILITY values returned by
+     n.getValue() are added to the stored values. Always returns true.
+  */
+    for(WordIndex word=1; int(word) < noEW; word++){
+        if (!(evlist[word].freq > 0))
+            continue;
+        for(WordIndex fert=0; fert < MAX_FERTILITY; fert++){
+            VALTYPE p = n.getValue(word, fert);
+            getRef(word,fert)+=p;
+        }
+    }
+    return true;
+}
+
+template <class VALTYPE>
+bool nmodel<VALTYPE>::readAugNTable(const char *filename){
+  /* Reads an n (fertility) table from a file and ADDS its values to the
+     stored ones (readNTable replaces them instead).
+     Each line has the format:  source_word_id p0 p1 p2 ... pn
+     with MAX_FERTILITY values per entry.
+     Returns false when the file cannot be opened, true otherwise.
+     Reading stops at end of file or at the first token that is not a
+     number; an entry that ends prematurely is reported on cerr and the
+     values read so far for it are kept.
+     The process exits when a token id exceeds MAX_VOCAB_SIZE.
+  */
+    ifstream inf(filename);
+    if(!inf.is_open()){
+        return false;
+    }
+    cerr << "Reading fertility table from " << filename << "\n";
+    
+    WordIndex tok;
+    int nFert=0;
+    bool truncated=false;
+    // Test the extraction itself rather than eof(): a trailing newline would
+    // otherwise trigger one more pass that adds stale values to the last
+    // row, and a non-numeric token would make the loop spin forever.
+    while(!truncated && (inf >> tok)){
+        if (tok > MAX_VOCAB_SIZE){
+            cerr << "NTables:readNTable(): unrecognized token id: " << tok
+                <<'\n';
+            exit(-1);
+        }
+        for(WordIndex i = 0; i < MAX_FERTILITY; i++){
+            VALTYPE prob;
+            if(!(inf >> prob)){
+                cerr << "NTables:readAugNTable(): incomplete entry for token id: "
+                    << tok <<'\n';
+                truncated=true;
+                break;
+            }
+            getRef(tok, i)+=prob;
+        }
+        if(!truncated)
+            nFert++;
+    }
+    cerr << "Read " << nFert << " entries in fertility table.\n";
+    inf.close();
+    return true;
+}
+
+// The member functions above are defined in this .cpp file, so the template
+// is explicitly instantiated for the value types that are used.
+template class nmodel<COUNT>;
+//template class nmodel<PROB>;
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/NTables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/NTables.h
@ -0,0 +1,145 @@
+/*
+
+ EGYPT Toolkit for Statistical Machine Translation
+ Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful, 
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+ USA.
+
+ */
+#ifndef _ntables_h
+#define _ntables_h 1
+#include "Array2.h"
+#include "Vector.h"
+#include <cassert>
+#include "defs.h"
+#include "vocab.h"
+#include "myassert.h"
+#include "Globals.h"
+#include "syncObj.h"
+
+extern double NTablesFactorGraphemes, NTablesFactorGeneral;
+
+/**
+ * Fertility table: a (word id) x (fertility) matrix of values of type
+ * VALTYPE. Reads never return less than PROB_SMOOTH for an in-range
+ * fertility; out-of-range fertilities read as 0.
+ */
+template<class VALTYPE> class nmodel {
+private:
+	Array2<VALTYPE, Vector<VALTYPE> > ntab;
+public:
+	/// Creates a maxw x maxn table filled with zeros.
+	nmodel(int maxw, int maxn) :
+		ntab(maxw, maxn, 0.0) {
+	}
+	/// Value for word w and fertility n, floored at PROB_SMOOTH; 0 when n
+	/// lies outside the table.
+	VALTYPE getValue(int w, unsigned int n) const {
+		massert(w!=0);
+		if (n>=ntab.getLen2())
+			return 0.0;
+		else
+			return max(ntab(w, n), VALTYPE(PROB_SMOOTH));
+	}
+protected:
+	/// Direct, unsmoothed and unlocked access to a table cell.
+	inline VALTYPE&getRef(int w, int n) {
+		//massert(w!=0);
+		return ntab(w, n);
+	};
+	Mutex lock;
+public:
+	/// Adds t to the cell (w, n) while holding the table lock.
+	inline void addValue(int w , int n,const VALTYPE& t){
+		lock.lock();
+		ntab(w,n)+=t;
+		lock.unlock();
+	};
+public:
+	/**
+	 * Writes a row-normalised copy of this table into `write`.
+	 *
+	 * Without a word list, or with both smoothing factors at zero, each row
+	 * is simply divided by its sum. Otherwise each row is first augmented
+	 * with NTablesFactorGraphemes times the fertility distribution of words
+	 * of the same length and NTablesFactorGeneral times the word-independent
+	 * fertility distribution, and then divided by the sum of the augmented
+	 * row. The number of written parameters is reported on cerr.
+	 */
+	template<class COUNT> void normalize(nmodel<COUNT>&write,
+			const Vector<WordEntry>* _evlist) const {
+		int h1=ntab.getLen1(), h2=ntab.getLen2();
+		int nParams=0;
+		if (_evlist&&(NTablesFactorGraphemes||NTablesFactorGeneral)) {
+			size_t maxlen=0;
+			const Vector<WordEntry>&evlist=*_evlist;
+			for (unsigned int i=1; i<evlist.size(); i++)
+				maxlen=max(maxlen, evlist[i].word.length());
+			// counts(len, k): mass of fertility k over all words of length len.
+			Array2<COUNT,Vector<COUNT> > counts(maxlen+1, MAX_FERTILITY+1, 0.0);
+			// nprob_general[k]: mass of fertility k over all words.
+			Vector<COUNT> nprob_general(MAX_FERTILITY+1,0.0);
+			for (unsigned int i=1; i<min((unsigned int)h1,
+					(unsigned int)evlist.size()); i++) {
+				int l=evlist[i].word.length();
+				for (int k=0; k<h2; k++) {
+					counts(l, k)+=getValue(i, k);
+					nprob_general[k]+=getValue(i, k);
+				}
+			}
+			// Turn each word-length row into a distribution and collect the
+			// total mass for the word-independent distribution.
+			COUNT sum2=0;
+			for (unsigned int i=1; i<maxlen+1; i++) {
+				COUNT sum=0.0;
+				for (int k=0; k<h2; k++)
+					sum+=counts(i, k);
+				sum2+=sum;
+				if (sum) {
+					for (int k=0; k<h2; k++)
+						counts(i, k)/=sum;
+				}
+			}
+			for (unsigned int k=0; k<nprob_general.size(); k++)
+				nprob_general[k]/=sum2;
+
+			for (int i=1; i<h1; i++) {
+				// l stays -1 for ids beyond the word list: no length smoothing.
+				int l=-1;
+				if ((unsigned int)i<evlist.size())
+					l=evlist[i].word.length();
+				COUNT sum=0.0;
+				for (int k=0; k<h2; k++)
+					sum+=getValue(i, k)+((l==-1) ? 0.0 : (counts(l, k)
+							*NTablesFactorGraphemes)) + NTablesFactorGeneral
+							*nprob_general[k];
+				assert(sum);
+				for (int k=0; k<h2; k++) {
+					// Divide the whole smoothed value by the row sum. The
+					// general term is part of `sum`, so it has to be inside
+					// the division for the row to add up to one.
+					write.getRef(i, k)=(getValue(i, k)+((l==-1) ? 0.0
+							: (counts(l, k)*NTablesFactorGraphemes))
+							+ NTablesFactorGeneral*nprob_general[k])/sum;
+					nParams++;
+				}
+			}
+		} else
+			for (int i=1; i<h1; i++) {
+				COUNT sum=0.0;
+				for (int k=0; k<h2; k++)
+					sum+=getValue(i, k);
+				assert(sum);
+				for (int k=0; k<h2; k++) {
+					write.getRef(i, k)=getValue(i, k)/sum;
+					nParams++;
+				}
+			}
+		cerr << "NTable contains " << nParams << " parameter.\n";
+	}
+
+	bool merge(nmodel<VALTYPE>& n, int noEW, const Vector<WordEntry>& evlist);
+	/// Resets every cell of the table to 0.
+	void clear() {
+		int h1=ntab.getLen1(), h2=ntab.getLen2();
+		for (int i=0; i<h1; i++)
+			for (int k=0; k<h2; k++)
+				ntab(i, k)=0;
+	}
+	void printNTable(int noEW, const char* filename,
+			const Vector<WordEntry>& evlist, bool) const;
+	void printRealNTable(int noEW, const char* filename,
+			const Vector<WordEntry>& evlist, bool) const;
+	bool readAugNTable(const char *filename);
+	bool readNTable(const char *filename);
+
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Parameter.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Parameter.cpp
@ -0,0 +1,144 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#include "Parameter.h"
+#include "fstream"
+#include "unistd.h"
+#include <sstream>
+#include <strstream>
+
+
+bool absolutePathNames=0;
+string ParameterPathPrefix;
+bool ParameterChangedFlag=0;
+
+// Writes one "name value" line to `of` for every parameter in `parset`
+// whose level equals `level` (or for all levels when level==-1) and that is
+// not marked onlyCopy. For file-name parameters with a non-empty relative
+// value, the current directory (when absolutePathNames is set) and/or
+// ParameterPathPrefix are written in front of the value.
+// Returns 0 when the stream is not usable, 1 otherwise.
+bool writeParameters(ofstream&of,const ParSet&parset,int level)
+{
+  if(!of)return 0;
+  for(ParSet::const_iterator i=parset.begin();i!=parset.end();++i)
+    {
+      if(((*i)->getLevel()==level||level==-1)&&(*i)->onlyCopy==0)
+	{
+	  // Render the value once into a string to inspect its first character.
+	  // std::ostringstream owns its buffer, unlike ostrstream whose str()
+	  // freezes the buffer and leaks it unless it is unfrozen again.
+	  ostringstream os;
+	  (*i)->printValue(os);
+	  const string s(os.str());
+	  of << (*i)->getString() << " ";
+	  if( absolutePathNames&&(*i)->isFilename()&&s.length()&&s[0]!='/' )
+	    {
+	      char path[1024];
+	      // getcwd leaves the buffer undefined on failure, so only use it
+	      // when the call succeeded.
+	      if( getcwd(path,sizeof(path)) )
+		of << path << '/';
+	      else
+		cerr << "WARNING: could not determine the current directory; writing a relative path.\n";
+	    }
+	  if( ParameterPathPrefix.length()&&(*i)->isFilename()&&s.length()&&s[0]!='/' )
+	    of << ParameterPathPrefix << '/'; 
+	  (*i)->printValue(of);
+	  of << endl;
+	}
+    }
+  return 1;
+}
+
+// Reads "name value" lines from `f` and applies each of them to `parset`
+// through makeSetCommand. Lines without any token are skipped; a line that
+// cannot be applied is reported on cerr and reading continues.
+// Returns 0 when the stream is not usable, 1 otherwise.
+bool readParameters(ifstream&f,const ParSet&parset,int verb,int level)
+{
+  string s;
+  if(!f)return 0;
+  while(getline(f,s))
+    {
+      istringstream line(s);
+      string s1,s2;
+      line>>s1>>s2;
+      // An empty name would match every parameter as a prefix and be
+      // reported as ambiguous, so blank lines are ignored.
+      if(s1.empty())
+	continue;
+      if(makeSetCommand(s1,s2,parset,verb,level)==0)
+	cerr << "ERROR: could not set: (C) " << s1 << " " << s2 << endl;
+    }
+  return 1;
+}
+
+ 
+// Sets the parameter named _s1 (after normalisation with simpleString) to
+// the value s2. An exact name match wins immediately; otherwise the name is
+// accepted as an abbreviation when it is the prefix of exactly one
+// parameter. The value is only applied when level is -1 or equals the
+// parameter's level; a level mismatch is reported when verb>1.
+// Returns 1 when a parameter was identified, 0 when the name is unknown or
+// ambiguous (both reported on cerr).
+bool makeSetCommand(string _s1,string s2,const ParSet&parset,int verb,int level)
+{
+  string s1=simpleString(_s1);
+  ParPtr prefixHit;
+  int prefixHits=0;
+  for(ParSet::const_iterator it=parset.begin();it!=parset.end();++it)
+    {
+      if( *(*it)==s1 )
+	{
+	  // Exact match: apply (or report the level mismatch) and stop.
+	  if( level==-1 || level==(*it)->getLevel() )
+	    (*it)->setParameter(s2,verb);
+	  else if(verb>1)
+	    cerr << "ERROR: Could not set: (A) " << s1 << " " << s2 << " " << level << " " << (*it)->getLevel() << endl;
+	  return 1;
+	}
+      if( (*it)->getString().substr(0,s1.length())==s1 )
+	{
+	  prefixHit=(*it);
+	  prefixHits++;
+	}
+    }
+
+  if( prefixHits==1 )
+    {
+      // Unique abbreviation.
+      if( level==-1 || level==prefixHit->getLevel() )
+	prefixHit->setParameter(s2,verb);
+      else if( verb>1 )
+	cerr << "ERROR: Could not set: (B) " << s1 << " " << s2 << " " << level << " " << prefixHit->getLevel() << endl;
+      return 1;
+    }
+
+  if( prefixHits>1 )
+    cerr << "ERROR: ambiguous parameter '" << s1 << "'.\n";
+  else
+    cerr << "ERROR: parameter '" << s1 << "' does not exist.\n";
+  return 0;
+}
+
+// Prints (via printAt) every parameter of `parset` whose level equals
+// `level`, or all of them when level==-1, skipping parameters marked
+// onlyCopy. One parameter per line. Returns the stream.
+ostream& printPars(ostream&of,const ParSet&parset,int level)
+{
+  if(!of)return of;
+  ParSet::const_iterator cur=parset.begin();
+  while(cur!=parset.end())
+    {
+      const bool wanted=((*cur)->getLevel()==level||level==-1)&&(*cur)->onlyCopy==0;
+      if(wanted)
+	{
+	  (*cur)->printAt(of);
+	  of << endl;
+	}
+      ++cur;
+    }
+  return of;
+}
+
+// Normalises a parameter name: returns `s` lower-cased with every character
+// other than a-z and 0-9 removed.
+string simpleString(const string s)
+{
+  string k;
+  k.reserve(s.length());
+  for(string::size_type i=0;i<s.length();++i)
+    {
+      // tolower() requires a value representable as unsigned char; passing a
+      // plain (possibly negative) char is undefined behaviour.
+      const char c=static_cast<char>(tolower(static_cast<unsigned char>(s[i])));
+      if( (c>='a'&&c<='z')||(c>='0'&&c<='9') )
+	k += c;
+    }
+  return k;
+}
+
+
+// Returns the process-wide parameter set. The set is a function-local
+// static, so it is constructed on the first call and every caller gets a
+// reference to the same object.
+ParSet&getGlobalParSet()
+{
+  static ParSet x;
+  return x;
+}
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Parameter.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Parameter.h
@ -0,0 +1,200 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef PARAMETER_H_DEFINED
+#define PARAMETER_H_DEFINED
+
+#include "mystl.h"
+#include <set>
+#include "Pointer.h"
+#include <string>
+#include "Globals.h"
+#include <fstream>
+#include <cstring>
+
+/*
+ * Helper for the integral mConvert() overloads: recognises the boolean words
+ * (case-insensitively). Returns 1 for yes/y/true/t, 0 for no/n/false/f and -1
+ * for anything else. A recognised word is echoed to cerr as TRUE or FALSE.
+ */
+inline int mConvertBoolWord(const string&s)
+{
+  const char*w=s.c_str();
+  if( strcasecmp(w,"yes")==0 || strcasecmp(w,"y")==0 || strcasecmp(w,"true")==0 || strcasecmp(w,"t")==0 )
+    {
+      cerr << "TRUE\n";
+      return 1;
+    }
+  if( strcasecmp(w,"no")==0 || strcasecmp(w,"n")==0 || strcasecmp(w,"false")==0 || strcasecmp(w,"f")==0 )
+    {
+      cerr << "FALSE\n";
+      return 0;
+    }
+  return -1;
+}
+/*
+ * Shared body of the integral mConvert() overloads: a boolean word yields 1
+ * or 0, every other string is parsed with atoi(). The value is stored in
+ * `target` and returned.
+ */
+template<class T> inline T mConvertIntegral(const string&s,T&target)
+{
+  const int word=mConvertBoolWord(s);
+  return target=static_cast<T>( word>=0 ? word : atoi(s.c_str()) );
+}
+/*
+ * mConvert(s,x): parse the string s into x and return the stored value.
+ * Integral and bool targets accept the boolean words described above;
+ * double/float use atof(); string targets receive a copy of s.
+ */
+inline unsigned int mConvert(const string&s,unsigned int &i)
+{ return mConvertIntegral(s,i); }
+inline int mConvert(const string&s,int &i)
+{ return mConvertIntegral(s,i); }
+inline double mConvert(const string&s,double &d)
+{ d=atof(s.c_str()); return d; }
+inline double mConvert(const string&s,float &d)
+{ d=atof(s.c_str()); return d; }
+inline string mConvert(const string&s,string&n)
+{ n=s; return n; }
+inline bool mConvert(const string&s,bool&n)
+{ return mConvertIntegral(s,n); }
+inline short mConvert(const string&s,short&n)
+{ return mConvertIntegral(s,n); }
+inline unsigned short mConvert(const string&s,unsigned short&n)
+{ return mConvertIntegral(s,n); }
+
+string simpleString(const string s);
+
+/*
+ * Polynomial string hash: starting from 0, every character c updates the
+ * running value to 5*value+c.
+ *
+ * The arithmetic is carried out on unsigned int so that long strings wrap
+ * around instead of overflowing a signed int, which is undefined behaviour.
+ * For inputs that never overflowed the result is unchanged.
+ */
+inline int Hashstring(const string& s)
+{
+  unsigned int sum=0;
+  for(string::const_iterator i=s.begin(),end=s.end();i!=end;++i)
+    sum=5u*sum+static_cast<unsigned int>(*i);
+  return static_cast<int>(sum);
+}
+
+/*
+ * Type-independent base class of a named program parameter.
+ *
+ * The name is stored in the normalised form produced by simpleString().
+ * Derived classes implement parsing (setParameter) and printing. Comparison,
+ * ordering and hashing all work on the normalised name.
+ */
+class _Parameter
+{
+ protected:
+  string name;         // normalised parameter name
+  bool *ifChanged;     // flag that setChanged() sets to true
+  string description;  // free-text description
+  int level;           // level reported by getLevel()
+  bool filename;       // see isFilename()/setFilename()
+ public:
+  int onlyCopy;
+
+  _Parameter(string n,bool&b,string desc,int _level,bool _onlyCopy)
+    : name(simpleString(n)),
+      ifChanged(&b),
+      description(desc),
+      level(_level),
+      filename(false),
+      onlyCopy(_onlyCopy)
+    {}
+  virtual ~_Parameter() {}
+
+  // True if s, once normalised, equals this parameter's name.
+  bool operator==(const string&s)const
+    { return simpleString(s)==name; }
+  void setChanged()
+    { *ifChanged=true; }
+
+  // Parse s2 into the bound variable; the int argument is the verbosity.
+  virtual bool setParameter(string s2,int)=0;
+  virtual ostream&printAt(ostream&out)=0;
+  virtual ostream&printValue(ostream&out)=0;
+
+  const string&getString() const
+    { return name; }
+  int getLevel() const
+    { return level; }
+  bool isFilename()
+    { return filename; }
+  void setFilename(bool x=1)
+    { filename=x; }
+
+  friend bool operator==(const _Parameter&a,const _Parameter&b)
+    { return a.name==b.name; }
+  friend bool operator<(const _Parameter&a,const _Parameter&b)
+    { return a.name<b.name; }
+  friend int Hash(const _Parameter&aaa)
+    { return Hashstring(aaa.name); }
+  friend ostream&operator<<(ostream&out,const _Parameter&p)
+    {
+      out<<"Parameter: "<<p.name <<endl;
+      return out;
+    }
+};
+
+/*
+ * A parameter bound to a variable of type T that lives elsewhere; the class
+ * only keeps a pointer to it. Values are parsed with the mConvert() overload
+ * matching T.
+ */
+template<class T>
+class Parameter : public _Parameter
+{
+ private:
+  T*t;
+ public:
+  Parameter(string n,bool&b,string desc,T&_t,int level=0,bool onlyCopy=0)
+    : _Parameter(n,b,desc,level,onlyCopy),t(&_t) {}
+  virtual ~Parameter(){}
+  /*
+   * Parse s2 and store it in the bound variable if it differs from the
+   * current value. Returns 1 (and raises the changed flag) when the value
+   * changed, 0 otherwise. For verb>1 the old and new value go to cout.
+   */
+  virtual bool setParameter(string s2,int verb)
+    { 
+      T parsed;
+      if( *t==mConvert(s2,parsed) )
+        return 0;
+      const bool announce=(verb>1);
+      if( announce )
+        cout << "Parameter '"<<name <<"' changed from '"<<*t<<"' to '";
+      // The string is converted a second time, directly into the target.
+      mConvert(s2,*t);
+      if( announce )
+        cout << *t <<"'\n";
+      setChanged();
+      return 1;
+    }
+  // Print "name = value  (description)".
+  virtual ostream&printAt(ostream&out)
+    {
+      out << name << " = " << *t << "  (" << description << ")";
+      return out;
+    }
+  // Print the current value only.
+  virtual ostream&printValue(ostream&out)
+    {
+      out << *t;
+      return out;
+    }
+};
+
+typedef MP<_Parameter> ParPtr;
+
+/*
+ * Set of parameters, ordered through operator< on ParPtr. insert() writes an
+ * error to cerr when an equivalent element is already present; the set is
+ * left unchanged in that case.
+ */
+class ParSet : public set<ParPtr>
+{
+ public:
+  void insert(const ParPtr&x)
+    {
+      const bool added=set<ParPtr>::insert(x).second;
+      if( !added )
+        cerr << "ERROR: element " << x->getString() << " already inserted.\n";
+    }
+};
+
+bool makeSetCommand(string s1,string s2,const ParSet&pars,int verb=1,int level= -1);
+ostream&printPars(ostream&out,const ParSet&pars,int level=-1);
+bool writeParameters(ofstream&of,const ParSet&parset,int level=0);
+bool readParameters(ifstream&f,const ParSet&parset,int verb=2,int level=0);
+ParSet&getGlobalParSet();
+extern bool ParameterChangedFlag;
+// Store init in *adr and register *adr in the global parameter set under
+// `name` at the given level. init is returned so that the call can serve as
+// the initialiser of the variable itself (see GLOBAL_PARAMETER).
+template<class T>const T&addGlobalParameter(const char *name,const char *description,int level,T*adr,const T&init)
+{
+  *adr=init;
+  ParSet&registry=getGlobalParSet();
+  registry.insert(new Parameter<T>(name,ParameterChangedFlag,description,*adr,level));
+  return init;
+}
+// As the one-name overload, but additionally registers the alias name2.
+// The alias is registered with level -1.
+template<class T>const T&addGlobalParameter(const char *name,const char *name2,const char *description,int level,T*adr,const T&init)
+{
+  *adr=init;
+  ParSet&registry=getGlobalParSet();
+  registry.insert(new Parameter<T>(name,ParameterChangedFlag,description,*adr,level));
+  registry.insert(new Parameter<T>(name2,ParameterChangedFlag,description,*adr,-1));
+  return init;
+}
+// As the one-name overload, but additionally registers the aliases name2 and
+// name3. Aliases are registered with level -1.
+template<class T>const T&addGlobalParameter(const char *name,const char *name2,const char *name3,const char *description,int level,T*adr,const T&init)
+{
+  *adr=init;
+  ParSet&registry=getGlobalParSet();
+  registry.insert(new Parameter<T>(name,ParameterChangedFlag,description,*adr,level));
+  const char*const aliases[]={name2,name3};
+  for(unsigned int a=0;a<2;++a)
+    registry.insert(new Parameter<T>(aliases[a],ParameterChangedFlag,description,*adr,-1));
+  return init;
+}
+// As the one-name overload, but additionally registers the aliases name2,
+// name3 and name4. Aliases are registered with level -1.
+template<class T>const T&addGlobalParameter(const char *name,const char *name2,const char *name3,const char *name4,const char *description,int level,T*adr,const T&init)
+{
+  *adr=init;
+  ParSet&registry=getGlobalParSet();
+  registry.insert(new Parameter<T>(name,ParameterChangedFlag,description,*adr,level));
+  const char*const aliases[]={name2,name3,name4};
+  for(unsigned int a=0;a<3;++a)
+    registry.insert(new Parameter<T>(aliases[a],ParameterChangedFlag,description,*adr,-1));
+  return init;
+}
+void MakeParameterOptimizing(istream&file,string resultingParameters);
+
+// Convenience macros that define a global variable VARNAME of type TYP and, in
+// the same statement, register it with the global parameter set through
+// addGlobalParameter(). GLOBAL_PARAMETER registers one name; the 2/3/4
+// variants register that many names for the same variable. INIT is both the
+// value written through &VARNAME and the initialiser of the definition.
+#define GLOBAL_PARAMETER(TYP,VARNAME,NAME,DESCRIPTION,LEVEL,INIT) TYP VARNAME=addGlobalParameter< TYP >(NAME,DESCRIPTION,LEVEL,&VARNAME,INIT);
+#define GLOBAL_PARAMETER2(TYP,VARNAME,NAME,NAME2,DESCRIPTION,LEVEL,INIT) TYP VARNAME=addGlobalParameter< TYP >(NAME,NAME2,DESCRIPTION,LEVEL,&VARNAME,INIT);
+#define GLOBAL_PARAMETER3(TYP,VARNAME,NAME,NAME2,NAME3,DESCRIPTION,LEVEL,INIT) TYP VARNAME=addGlobalParameter< TYP >(NAME,NAME2,NAME3,DESCRIPTION,LEVEL,&VARNAME,INIT);
+#define GLOBAL_PARAMETER4(TYP,VARNAME,NAME,NAME2,NAME3,NAME4,DESCRIPTION,LEVEL,INIT) TYP VARNAME=addGlobalParameter< TYP >(NAME,NAME2,NAME3,NAME4,DESCRIPTION,LEVEL,&VARNAME,INIT);
+
+void setParameterLevelName(unsigned int i,string x);
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Perplexity.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Perplexity.cpp
@ -0,0 +1,42 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* Perplexity.cc
+ * =============
+ * Mike Jahr, 7/21/99
+ * Machine Translation group, WS99
+ * Center for Language and Speech Processing
+ * 
+ * Last Modified by: Yaser Al-Onaizan, August 17, 1999
+ *
+ * Simple class used to calculate cross entropy and perplexity
+ * of models.
+ */
+
+#include "Perplexity.h"
+
+// Append a snapshot of the current statistics: the label `model` goes to
+// modelid, the current perplexity() to perp and the current cross_entropy()
+// to ce. The three appends happen while the object's mutex is held.
+void Perplexity::record(string model){
+  mutex.lock();
+  modelid.push_back(model);
+  perp.push_back(perplexity());
+  ce.push_back(cross_entropy());
+  mutex.unlock();
+}
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Perplexity.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Perplexity.h
@ -0,0 +1,115 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* Perplexity.h
+ * ============
+ * Mike Jahr, 7/15/99
+ * Machine Translation group, WS99
+ * Center for Language and Speech Processing
+ * 
+ * Last Modified by: Yaser Al-Onaizan, August 17, 1999
+ *
+ * Simple class used to calculate cross entropy and perplexity
+ * of models.
+ */
+
+#ifndef _PERPLEXITY_H
+#define _PERPLEXITY_H
+
+#include <cmath>
+#include <fstream>
+#include "Vector.h"
+#include "defs.h"
+#include "Array2.h"
+#include "Globals.h"
+#include "syncObj.h"
+
+#define CROSS_ENTROPY_BASE 2
+
+// Accumulates a weighted sum (`sum`) and a word count (`wc`) from which
+// perplexity and cross entropy are derived, and keeps a history of recorded
+// values (see record()).
+//
+// NOTE(review): the class owns E_M_L through a raw pointer and deletes it in
+// the destructor, but declares no copy constructor or assignment operator;
+// copying an instance would delete the table twice - confirm that instances
+// are never copied.
+class Perplexity {
+ private:
+    // Running total updated by addFactor().
+    double sum;
+    // Running word count updated by addFactor().
+    double wc;
+    // Table filled in the constructor; entry (l, m) is the log of the Poisson
+    // probability of m with mean LAMBDA*l.
+    Array2<double, Vector<double> > *E_M_L;
+    // History written by record(): label, perplexity and cross entropy.
+    Vector<string> modelid;
+    Vector<double > perp;
+    Vector<double > ce;
+    // Only cleared in the constructor within this class definition.
+    Vector<string> name ;
+	// Guards sum/wc in clear() and addFactor(), and the history in record().
+	Mutex mutex;
+ public:
+	~Perplexity() { delete E_M_L;}
+	// Builds the E_M_L table for all l, m in [1, MAX_SENTENCE_LENGTH) and
+	// resets the accumulators.
+	Perplexity() {
+		E_M_L  = new Array2<double, Vector<double> >(MAX_SENTENCE_LENGTH,MAX_SENTENCE_LENGTH);
+		unsigned int l, m ;
+		// fact[m] holds m! (fact[0] and fact[1] keep their initial value 1.0).
+		Vector<double> fact(MAX_SENTENCE_LENGTH, 1.0);
+		for (m = 2 ; m < MAX_SENTENCE_LENGTH ; m++)
+			fact[m] = fact[m-1] * m ;
+		for (m = 1 ; m < MAX_SENTENCE_LENGTH ; m++)
+			for (l = 1 ; l < MAX_SENTENCE_LENGTH ; l++) {
+				(*E_M_L)(l, m) = log (pow((LAMBDA * l), double(m)) * exp(-LAMBDA * double(l)) / 
+									  (fact[m])) ;
+			}
+		sum = 0 ;
+		wc = 0;
+		perp.clear();
+		ce.clear();
+		name.clear();
+	}
+    // Resets the accumulators (the recorded history is kept).
+    inline void clear() {
+	  mutex.lock();
+      sum = 0 ;
+      wc = 0 ;
+	  mutex.unlock();
+    }
+    // Number of recorded entries (the smaller of the two history lengths).
+    size_t size() const {return(min(perp.size(), ce.size()));}
+	// Adds count*m to the word count and count*(p [+ E_M_L(l,m)]) to the sum;
+	// the table term is included only when withPoisson is true.
+	// NOTE(review): p is presumably a log probability - confirm with callers.
+	inline void addFactor(const double p, const double count, const int l, 
+						  const int m,bool withPoisson) {
+		mutex.lock();
+		wc += count * m ; // number of french words 
+		sum += count * ( (withPoisson?((*E_M_L)(l, m)):0.0) + p) ;
+		mutex.unlock();
+	}
+    
+	// exp(-sum/wc). Reads sum and wc without taking the mutex.
+	inline double perplexity() const {
+		return exp( -1*sum / wc);
+    }
+
+    // -sum / (wc * log(CROSS_ENTROPY_BASE)). Reads without taking the mutex.
+    inline double cross_entropy() const {
+		return (-1.0*sum / (log(double(CROSS_ENTROPY_BASE)) * wc)); 
+    }
+
+    inline double word_count() const {
+		return wc;
+    }
+    
+    inline double getSum() const {
+		return sum ;
+    }
+
+    // Appends the current perplexity and cross entropy under the given label.
+    void record(string model);
+    
+    friend void generatePerplexityReport(const Perplexity&, const Perplexity&, 
+					 const Perplexity&, const Perplexity&, 
+					 ostream&, int, int, bool); 
+};
+
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Pointer.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Pointer.h
@ -0,0 +1,175 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef HEADER_Pointer_DEFINED
+#define HEADER_Pointer_DEFINED
+
+#include <cassert>
+#include <iostream>
+
+/*
+ * Minimal wrapper around a raw pointer to a mutable T. It never deletes the
+ * pointee; it only provides dereferencing, a null test and access to the raw
+ * pointer. Base class of the UP/MP/DELP wrappers.
+ */
+template<class T>
+class SmartPointer
+{
+ protected:
+  T*p;
+ public:
+  SmartPointer(T*_p=0) 
+    : p(_p) {}
+  inline T&operator*() const 
+    {return *p;}
+  inline T*operator->() const 
+    {return p;}
+  // True for a non-null pointer.
+  inline operator bool() const 
+    {return p!=0;}
+  inline T*ptr() const
+    { return p; }
+};
+// Print the pointee, or the text "nullpointer" for a null pointer.
+// std::ostream is spelled out so that the header does not depend on a
+// using-directive supplied by whoever includes it.
+template<class T> inline std::ostream &operator<<(std::ostream&out,const SmartPointer<T>&s)
+{if( s.ptr() )return out << *s;else return out <<"nullpointer";}
+
+
+/*
+ * Minimal wrapper around a raw pointer to a const T. It never deletes the
+ * pointee; it only provides read-only dereferencing, a null test and access
+ * to the raw pointer. Base class of the UPConst/MPConst wrappers.
+ */
+template<class T>
+class SmartPointerConst
+{
+ protected:
+  const T*p;
+ public:
+  SmartPointerConst(const T*_p=0) 
+    : p(_p) {}
+  inline const T&operator*() const 
+    {return *p;}
+  inline const T*operator->() const 
+    {return p;}
+  // True for a non-null pointer.
+  inline operator bool() const
+    {return p!=0;}
+  inline const T*ptr() const
+    { return p; }
+};
+// Print the pointee, or the text "nullpointer" for a null pointer.
+// std::ostream is spelled out so that the header does not depend on a
+// using-directive supplied by whoever includes it.
+template<class T> inline std::ostream &operator<<(std::ostream&out,const SmartPointerConst<T>&s)
+{if( s.ptr() )return out << *s;else return out <<"nullpointer";}
+
+/*
+ * Pointer wrapper with identity semantics: == and < compare the stored
+ * addresses, while Hash() hashes the pointee (0 for a null pointer).
+ */
+template <class T>
+class UP : public SmartPointer<T>
+{
+ public:
+  UP(T*_p=0) 
+    : SmartPointer<T>(_p) {}
+};
+template<class T> inline bool operator==(const UP<T>&s1,const UP<T>&s2)
+{
+  return s1.ptr()==s2.ptr();
+}
+template<class T>  inline bool operator<(const UP<T>&s1,const UP<T>&s2)
+{
+  return s1.ptr() < s2.ptr();
+}
+template<class T> inline int Hash(const UP<T> &wp)
+{
+  return wp.ptr() ? Hash(*wp) : 0;
+}
+
+
+/*
+ * Const-pointee counterpart of UP: == and < compare the stored addresses,
+ * while Hash() hashes the pointee (0 for a null pointer).
+ */
+template <class T>
+class UPConst : public SmartPointerConst<T>
+{
+ public:
+  UPConst(const T*_p=0) 
+    : SmartPointerConst<T>(_p) {}
+};
+template<class T> inline bool operator==(const UPConst<T>&s1,const UPConst<T>&s2)
+{
+  return s1.ptr()==s2.ptr();
+}
+template<class T> inline bool operator<(const UPConst<T>&s1,const UPConst<T>&s2)
+{
+  return s1.ptr()<s2.ptr();
+}
+template<class T> inline int Hash(const UPConst<T> &wp)
+{
+  return wp.ptr() ? Hash(*wp) : 0;
+}
+
+	
+/*
+ * Pointer wrapper with value semantics: == and < compare the pointed-to
+ * objects (both operands are asserted to be non-null), and Hash() hashes the
+ * pointee (0 for a null pointer).
+ */
+template <class T>
+class MP : public SmartPointer<T>
+{
+ public:
+  MP(T*_p=0) 
+    : SmartPointer<T>(_p) {}
+};
+template <class T> inline bool operator==(const MP<T>&s1,const MP<T>&s2)
+{
+  assert(s1);
+  assert(s2);
+  return *s1==*s2;
+}
+template <class T> inline bool operator<(const MP<T>&s1,const MP<T>&s2)
+{
+  assert(s1);
+  assert(s2);
+  return *s1 < *s2;
+}
+template <class T> inline int Hash(const MP<T> &wp)
+{
+  return wp.ptr() ? Hash(*wp) : 0;
+}
+
+
+/*
+ * Const-pointee counterpart of MP: == and < compare the pointed-to objects
+ * (both operands are asserted to be non-null), and Hash() hashes the pointee
+ * (0 for a null pointer).
+ */
+template <class T>
+class MPConst : public SmartPointerConst<T>
+{
+ public:
+  MPConst(const T*_p=0) 
+    : SmartPointerConst<T>(_p) {}
+};
+template <class T> inline bool operator==(const MPConst<T>&s1,const MPConst<T>&s2)
+{
+  assert(s1);
+  assert(s2);
+  return *s1== *s2;
+}
+template <class T> inline bool operator<(const MPConst<T>&s1,const MPConst<T>&s2)
+{
+  assert(s1);
+  assert(s2);
+  return *s1 < *s2;
+}
+template <class T> inline int Hash(const MPConst<T> &wp)
+{
+  return wp.ptr() ? Hash(*wp) : 0;
+}
+
+
+/*
+ * Owning pointer: the pointee is deleted in the destructor, when another
+ * pointer is installed with set(), and when another DELP is assigned.
+ * Assignment transfers ownership and leaves the right-hand side null.
+ * The copy constructor is declared private (no definition in this header),
+ * so instances cannot be copied from outside the class.
+ *
+ * == and < compare the pointed-to objects and dereference both operands
+ * without a null check.
+ */
+template <class T> 
+class DELP : public SmartPointer<T>
+{
+ private:
+  DELP(const DELP<T>&x);
+ public:
+  // Take over the pointee of x; x becomes null. Assigning an object to
+  // itself is a no-op (previously it deleted the pointee and left null).
+  const DELP<T>&operator=(DELP<T>&x)
+  {
+    if( this!=&x )
+      {
+        delete this->p;
+        this->p=x.p;
+        x.p=0;
+      }
+    return *this;
+  }
+
+  ~DELP()
+    { delete this->p;this->p=0;}
+  DELP(T*_p=0) 
+    : SmartPointer<T>(_p) {}
+  // Replace the owned pointer, deleting the previous pointee. Passing the
+  // pointer that is already owned is a no-op (previously the pointee was
+  // deleted and the dangling pointer kept).
+  void set(T*_p)
+    {
+      if( this->p!=_p )
+        {
+          delete this->p;
+          this->p=_p;
+        }
+    }
+  friend bool operator==(const DELP<T>&s1,const DELP<T>&s2)
+    {
+      return *(s1.p)== *(s2.p);
+    }
+  friend bool operator<(const DELP<T>&s1,const DELP<T>&s2)
+    {
+      return *(s1.p) < *(s2.p);
+    }
+  // Hash of the pointee, or 0 for a null pointer.
+  friend inline int Hash(const DELP<T> &wp)
+    {
+      if(wp.p)
+	return Hash(*wp.p);
+      else 
+	return 0;
+    }
+};
+#endif
+
+
+
+
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/SetArray.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/SetArray.cpp
@ -0,0 +1,5 @@
+
+//#include "SetArray.h"
+
+#include "Parameter.h"
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/SetArray.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/SetArray.h
@ -0,0 +1,159 @@
+/*
+An array of maps (one map per first-index word) giving fast access to
+dictionary entries and, most importantly, intended to be thread-safe.
+*/
+
+
+#ifndef __SET_ARRAY_H__
+#define __SET_ARRAY_H__
+
+#include <map>
+#include <vector>
+#include "defs.h"
+#include "vocab.h"  
+#include <cstdio>
+#include <cstdlib>
+#include <pthread.h>
+#include "syncObj.h"
+
+// A (count, probability) pair. Both members are zero after default
+// construction; the two-argument constructor sets them explicitly.
+template <class COUNT, class PROB>
+class LpPair {
+public:
+    COUNT count ;
+    PROB  prob ;
+
+    LpPair()
+        : count(0), prob(0) {}
+    LpPair(COUNT c, PROB p)
+        : count(c), prob(p) {}
+} ;
+
+
+
+
+/*
+ * Two-level table of (count, prob) entries: store[k] is a map from the second
+ * index to its CPPair. The member functions that look up or modify a single
+ * entry hold muts[k] while they touch store[k]; getMap()/getMap1() return the
+ * map without locking.
+ *
+ * NOTE(review): find() and findRef() hand out a pointer/reference that is
+ * used after the lock has been released - callers must make sure the entry
+ * is not erased concurrently.
+ */
+template <class COUNT, class PROB>
+class SetArray{
+public:
+         typedef LpPair<COUNT, PROB> CPPair;
+protected:
+    
+    /* store[k] holds the entries whose first index is k. */
+    std::vector<std::map<size_t,CPPair> > store;
+    /* muts[k] guards store[k]. */
+    std::vector<Mutex> muts;
+    size_t nEnglishWord;
+    size_t nFrenchWord;
+    void _init(){
+        store.resize(nEnglishWord);
+        // muts is always indexed with the same value as store, so it needs
+        // the same length (it used to be sized by nFrenchWord, which could
+        // leave it shorter than store).
+        muts.resize(nEnglishWord);
+    }
+    
+public:
+       
+    /*
+        Look up (fi, si) without creating it.
+        Returns a pointer to the entry, or 0 if it does not exist.
+    */
+    CPPair* find(size_t fi, size_t si){
+        muts[fi].lock();
+        /* Sync-ed */
+        std::map<size_t,CPPair>& w = store[fi];
+        typename std::map<size_t,CPPair>::iterator it = w.find(si);
+        CPPair* q = ( it!=w.end() ? &(it->second) : 0);
+        /* End Synced*/
+        muts[fi].unlock();
+        return q;
+    }
+    
+    /*
+        Look up (fi, si), creating a default entry if it does not exist.
+        Returns a reference to the entry (the function previously ended
+        without a return statement).
+    */
+    inline CPPair& findRef(size_t fi, size_t si){
+        std::map<size_t,CPPair> &x = store[fi];
+        muts[fi].lock();
+        /* Sync-ed */
+        CPPair& ref= x[si];
+        /* End Synced */
+        muts[fi].unlock();
+        return ref;
+    }
+
+    /* Create or overwrite the entry (fi, si) with the given count and prob. */
+    void insert(size_t fi, size_t si, COUNT count = 0, PROB prob = 0){
+        muts[fi].lock();
+        /* Synced */
+        std::map<size_t,CPPair> &x = store[fi];
+        CPPair& v= x[si];
+        v.count = count;
+        v.prob = prob;
+        muts[fi].unlock();
+    }
+    
+    void incCount(size_t e, size_t f, COUNT inc) 
+        // increments the count of the given word pair. if the pair does not exist, 
+        // it creates it with the given value. A zero increment does nothing.
+        {
+            if( inc ){
+                std::map<size_t,CPPair> &x = store[e];
+                muts[e].lock();
+                CPPair& ref= x[f];
+                ref.count += inc;
+                muts[e].unlock();
+            }
+        }
+
+    PROB getProb(size_t e, size_t f) const
+        // read probability value for P(fj/ei) from the table 
+    // if pair does not exist, return floor value PROB_SMOOTH; stored values
+    // below PROB_SMOOTH are raised to PROB_SMOOTH as well
+    {
+        muts[e].lock();
+        typename std::map<size_t,CPPair >::const_iterator it = store[e].find(f);
+        PROB b;
+        if(it == store[e].end())  
+            b = PROB_SMOOTH; 
+        else
+            b=max((it->second).prob, PROB_SMOOTH);
+        muts[e].unlock();
+        return b;
+    }
+    
+    COUNT getCount(size_t e, size_t f) const
+        /* read count value for entry pair (fj/ei) from the table; 0 if the
+           pair does not exist (the function previously ended without a
+           return statement) */
+    {
+        muts[e].lock();
+        typename std::map<size_t,CPPair >::const_iterator it = store[e].find(f);
+        COUNT c;
+        if(it == store[e].end())  
+            c = 0; 
+        else
+            c = ((*it).second).count;
+        muts[e].unlock();
+        return c;
+    }
+    
+    void erase(size_t e, size_t f)
+        // In: a source and a target token ids.
+        // removes the entry with that pair from table
+    {
+        muts[e].lock();   
+        store[e].erase(f);
+        muts[e].unlock();
+    }
+    
+    /* Changing the first-index size re-sizes store and muts. */
+    inline void setNumberOfEnlish(size_t e){nEnglishWord=e;_init();}
+    inline void setNumberOfFrench(size_t f){nFrenchWord = f;}
+    
+    /* Unsynchronised access to the whole map of first index i. */
+    const std::map<size_t,CPPair>& getMap(size_t i) const{
+        return store[i];
+    }
+    
+    std::map<size_t,CPPair>& getMap1(size_t i){
+        return store[i];
+    }
+    
+    SetArray(size_t e, size_t f): nEnglishWord(e), nFrenchWord(f){
+        _init();
+    }
+};
+
+
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/TTables.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/TTables.cpp
@ -0,0 +1,177 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+ 
+*/
+#include "TTables.h"
+#include "Parameter.h"
+#include<iostream>
+#include <fstream>
+
+// Global float PROB_CUTOFF, registered as "PROB CUTOFF", initial value 1e-7.
+GLOBAL_PARAMETER(float,PROB_CUTOFF,"PROB CUTOFF","Probability cutoff threshold for lexicon probabilities",PARLEV_OPTHEUR,1e-7);
+// Global float COUNTINCREASE_CUTOFF, registered as "COUNTINCREASE CUTOFF" and
+// under the alias "countCutoff", initial value 1e-6.
+GLOBAL_PARAMETER2(float, COUNTINCREASE_CUTOFF,"COUNTINCREASE CUTOFF","countCutoff","Counts increment cutoff threshold",PARLEV_OPTHEUR,1e-6);
+
+
+/* ------------------ Method Definitions for Class tmodel -------------------*/
+
+
+// To output to STDOUT, submit filename as NULL
+// Write the count of every stored (e, f) pair whose prob exceeds
+// MINCOUNTINCREASE, one "e f count" triple per line. With actual==true the
+// words from evlist/fvlist are printed instead of the numeric ids.
+// To output to STDOUT, submit filename as NULL.
+//
+// The file stream is an automatic object, so it is closed and released on
+// every exit path (it used to be allocated with new and freed by hand).
+//
+// NOTE(review): the filter tests x.prob although x.count is what gets
+// printed - confirm that this is intended.
+template <class COUNT, class PROB>
+void tmodel<COUNT, PROB>::printCountTable(const char *filename, 
+					 const Vector<WordEntry>& evlist, 
+					 const Vector<WordEntry>& fvlist,
+					 const bool actual) const
+{
+	ofstream file;
+	if( filename )
+		file.open(filename);
+	ostream &of = filename ? static_cast<ostream&>(file) : cout;
+
+	for(unsigned int i=0;i<lexmat.size();++i){
+		if( !lexmat[i] )
+			continue;
+		for(unsigned int j=0;j<lexmat[i]->size();++j){
+			const CPPair&x=(*lexmat[i])[j].second;
+			if( !(x.prob>MINCOUNTINCREASE) )
+				continue;
+			const WordIndex e=i,f=(*lexmat[i])[j].first;
+			if( actual )
+				of << evlist[e].word << ' ' << fvlist[f].word << ' ' << x.count << '\n';
+			else
+				of << e << ' ' << f << ' ' << x.count << '\n';
+		}
+	}
+
+	if( filename )
+		file.close();
+}
+
+// Write the probability of every stored (e, f) pair whose prob exceeds
+// PROB_SMOOTH to the file `filename`, one "e f prob" triple per line. With
+// actual==true the words from evlist/fvlist are printed instead of the ids.
+template <class COUNT, class PROB>
+void tmodel<COUNT, PROB>::printProbTable(const char *filename, 
+					 const Vector<WordEntry>& evlist, 
+					 const Vector<WordEntry>& fvlist,
+					 const bool actual) const
+{
+	ofstream of(filename);
+	for(unsigned int i=0;i<lexmat.size();++i){
+		if( !lexmat[i] )
+			continue;
+		for(unsigned int j=0;j<lexmat[i]->size();++j){
+			const CPPair&x=(*lexmat[i])[j].second;
+			if( !(x.prob>PROB_SMOOTH) )
+				continue;
+			const WordIndex e=i,f=(*lexmat[i])[j].first;
+			if( actual )
+				of << evlist[e].word << ' ' << fvlist[f].word << ' ' << x.prob << '\n';
+			else
+				of << e << ' ' << f << ' ' << x.prob << '\n';
+		}
+	}
+}
+
+// Intentionally empty in this implementation: all arguments are ignored and
+// nothing is written.
+template <class COUNT, class PROB>
+void tmodel<COUNT, PROB>::printProbTableInverse(const char *, 
+				   const Vector<WordEntry>&, 
+				   const Vector<WordEntry>&, 
+				   const double, 
+				   const double, 
+				   const bool ) const
+{
+}
+// Turn the accumulated counts of every row of lexmat into probabilities:
+// each prob becomes count / (sum of the row's counts), or 1/rowSize when the
+// row's counts sum to zero. All counts are reset to 0 afterwards. The three
+// arguments are unused.
+template <class COUNT, class PROB>
+void tmodel<COUNT, PROB>::normalizeTable(const vcbList&, const vcbList&, int)
+{
+    for(unsigned int i=0;i<lexmat.size();++i){
+        if( !lexmat[i] )
+            continue;
+        const unsigned int nEntries=lexmat[i]->size();
+        double total=0.0;
+        for(unsigned int j=0;j<nEntries;++j)
+            total+=(*lexmat[i])[j].second.count;
+        const bool noMass=(total==0);
+        for(unsigned int j=0;j<nEntries;++j)  {
+            if( noMass )
+                (*lexmat[i])[j].second.prob=1.0/(nEntries);
+            else
+                (*lexmat[i])[j].second.prob=(*lexmat[i])[j].second.count/total;
+            (*lexmat[i])[j].second.count=0;
+        }
+    }
+}
+
+// Read a t table from `filename`. Each line has the format
+//   source_word_id target_word_id p(target_word|source_word)
+// and is inserted with a count of 0.0; reading stops at the first entry that
+// cannot be parsed. Progress is reported on cerr. Returns false if the file
+// cannot be opened, true otherwise.
+template <class COUNT, class PROB>
+bool tmodel<COUNT, PROB>::readProbTable(const char *filename){
+	ifstream inf(filename);
+	cerr << "Reading t prob. table from " << filename << "\n";
+	if (inf) {
+		WordIndex src_id, trg_id;
+		PROB prob;
+		int nEntry=0;
+		for (; inf >> src_id >> trg_id >> prob; ++nEntry)
+			insert(src_id, trg_id, 0.0, prob);
+		cerr << "Read " << nEntry << " entries in prob. table.\n";
+		return true;
+	}
+	cerr << "\nERROR: Cannot open " << filename << "\n";
+	return false;
+}
+
+
+
+template class tmodel<COUNT,PROB> ; 
+
+/* ---------------- End of Method Definitions of class tmodel ---------------*/
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/TTables.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/TTables.h
@ -0,0 +1,330 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* --------------------------------------------------------------------------*
+ *                                                                           *
+ * Module : TTables                                                          *
+ *                                                                           *
+ * Prototypes File: TTables.h                                               *
+ *                                                                           *
+ * Objective: Defines classes and methods for handling I/O for Probability & *
+ *            Count tables and also alignment tables                         *
+ *****************************************************************************/
+
+#ifndef _ttables_h
+#define _ttables_h 1
+
+
+#include "defs.h"
+#include "vocab.h"  
+
+#include <cassert>
+ 
+#include <iostream>
+#include <algorithm>
+#include <functional>
+#include <map>
+#include <set>
+#include "Vector.h"
+#include <utility>
+#include "syncObj.h"
+
+#if __GNUC__>2
+#include <ext/hash_map>
+using __gnu_cxx::hash_map;
+#else
+#include <hash_map>
+#endif
+
+#include <fstream>
+
+#include "Globals.h"
+
+
+/* The tables defined in the following classes are defined as hash tables. For
+   example, the t-table is a hash function of a word pair; an alignment is 
+   a hash function of a vector of integer numbers (sentence positions), and so
+   on.  */
+
+
+/*----------- Definition of Hash Function for class tmodel ------------------*/
+
+typedef pair<WordIndex, WordIndex> wordPairIds;
+
+
+/* Hash functor for a (WordIndex, WordIndex) pair: MAX_W * first + second. */
+class hashpair : public unary_function< pair<WordIndex, WordIndex>, size_t >
+{
+public:
+  size_t operator() (const pair<WordIndex, WordIndex>& key) const
+    {
+      /* NOTE(review): the value is unique per pair only if key.second is
+	 below MAX_W and the product fits in size_t -- confirm against the
+	 definition of MAX_W. */
+      const size_t rowBase = (size_t) MAX_W*key.first;
+      return rowBase + key.second;
+    }
+};
+
+
+
+/* ------------------ Class Prototype Definitions ---------------------------*
+  Class Name: tmodel
+  Objective: This defines the underlying data structure for t Tables and t 
+  Count Tables. They are defined as a hash table. Each entry in the hash table
+  is the probability ( P(fj/ei) ) or the count collected for ( C(fj/ei) ). The 
+  probability and the count are represented as log integer probability as 
+  defined by the class LogProb.
+
+  This class is used to represent t Tables (probability) and n (fertility) 
+  Tables and also their corresponding count tables.
+ 
+ *---------------------------------------------------------------------------*/
+
+//typedef float COUNT ;
+//typedef LogProb PROB ;
+/* One table cell: a count together with a probability. */
+template <class COUNT, class PROB>
+class LpPair {
+public:
+    COUNT count;
+    PROB  prob;
+
+    // Zero-initialised cell.
+    LpPair() : count(0), prob(0) {}
+    // Cell holding the given count and probability.
+    LpPair(COUNT c, PROB p) : count(c), prob(p) {}
+};
+
+/* Binary search over the half-open range [x,y), whose elements must be
+   ordered by ascending ->first.  Returns the element whose ->first equals
+   val, or 0 when there is none. */
+template<class T>
+T*mbinary_search(T*x,T*y,unsigned int val)
+{
+  T*lo=x;
+  T*hi=y;
+  for(;;)
+    {
+      if( hi==lo )
+	return 0;                 // empty range
+      if( lo->first==val )
+	return lo;
+      if( hi-lo<2 )
+	return 0;                 // single element and it did not match
+      T*const mid=lo+(hi-lo)/2;
+      if( val < mid->first )
+	hi=mid;                   // continue in [lo,mid)
+      else
+	lo=mid;                   // continue in [mid,hi)
+    }
+}
+
+/* Const overload: binary search over the half-open range [x,y), whose
+   elements must be ordered by ascending ->first.  Returns the element whose
+   ->first equals val, or 0 when there is none. */
+template<class T>
+const T*mbinary_search(const T*x,const T*y,unsigned int val)
+{
+  const T*lo=x;
+  const T*hi=y;
+  for(;;)
+    {
+      if( hi==lo )
+	return 0;                 // empty range
+      if( lo->first==val )
+	return lo;
+      if( hi-lo<2 )
+	return 0;                 // single element and it did not match
+      const T*const mid=lo+(hi-lo)/2;
+      if( val < mid->first )
+	hi=mid;                   // continue in [lo,mid)
+      else
+	lo=mid;                   // continue in [mid,hi)
+    }
+}
+
+/* Sparse t-table keyed by (source word id e, target word id f).
+
+   lexmat[e] is either null (no row for e) or a vector of
+   (f, count/probability) cells.  The file-reading constructor asserts that
+   its input is ordered by e and then by f, which is what allows find() to
+   use mbinary_search on a row.  The set of cells is fixed at construction:
+   insert(), erase() and incCount() only touch cells that already exist.
+
+   NOTE: rows are allocated with new and are not freed by this class. */
+template <class COUNT, class PROB>
+class tmodel{
+	typedef LpPair<COUNT, PROB> CPPair;
+	typedef vector< pair<unsigned int,CPPair> > Row;
+
+	// Row of source word e, or null when e lies outside the table or has
+	// no row.  Both find() overloads go through this check, so an id that
+	// is negative or >= lexmat.size() never indexes lexmat.
+	Row*rowOf(int e) const{
+		if( e<0 || static_cast<size_t>(e)>=lexmat.size() )
+			return 0;
+		return lexmat[e];
+	}
+public:
+	bool recordDiff;
+        
+public:
+	int noEnglishWords;  // total number of unique source words
+	int noFrenchWords;   // total number of unique target words
+	//vector<pair<unsigned int,CPPair> > fs;
+	//vector<unsigned int> es;
+	vector< vector<pair<unsigned int,CPPair> >* > lexmat;  // one row per source word id (may be null)
+	vector< Mutex > mutex;                                  // one lock per row, used by incCount()
+      
+	// Resets the cell (e,f) to count 0 / prob 0 if it exists.
+	void erase(WordIndex e, WordIndex f){
+		CPPair *p=find(e,f);
+		if(p)
+			*p=CPPair(0,0);
+	};
+      
+	// Returns the cell for (e,f), or null when the table has no such cell.
+	CPPair*find(int e,int f){
+		Row*row=rowOf(e);
+		if( row==0 || row->empty() )
+			return 0;
+		pair<unsigned int,CPPair> *be=&(*row)[0];
+		pair<unsigned int,CPPair> *x=mbinary_search(be,be+row->size(),f);
+		return x ? &(x->second) : 0;
+	}
+      
+	// Const overload of find(); same lookup, same bounds checking.
+	const CPPair*find(int e,int f)const{
+		const Row*row=rowOf(e);
+		if( row==0 || row->empty() )
+			return 0;
+		const pair<unsigned int,CPPair> *be=&(*row)[0];
+		const pair<unsigned int,CPPair> *x=mbinary_search(be,be+row->size(),f);
+		return x ? &(x->second) : 0;
+	}
+public:
+	// Overwrites the cell (e,f) with (cval,pval).  Does nothing when the
+	// cell does not exist -- no new cell is created.
+	void insert(WordIndex e, WordIndex f, COUNT cval=0.0, PROB pval = 0.0){
+		CPPair* found = find(e,f);
+		if(found)
+			*found=CPPair(cval,pval);
+	}
+      
+	CPPair*getPtr(int e,int f){return find(e,f);}
+
+	// Empty table.
+	tmodel():recordDiff(false),noEnglishWords(0),noFrenchWords(0){};
+
+	// Builds the table layout from a text file of "e f" id pairs, ordered
+	// by e and then by f (asserted).  Every pair becomes a zero-initialised
+	// cell.  If the file cannot be opened or contains no pairs, an error is
+	// reported for the former and the table is left empty.
+	tmodel(const string&fn)
+		:recordDiff(false),noEnglishWords(0),noFrenchWords(0)
+	{
+		int count=0,count2=0;
+		ifstream infile2(fn.c_str());
+		cerr << "Inputfile in " << fn << endl;
+		if( !infile2 )
+			cerr << "ERROR: can't read coocurrence file " << fn << '\n';
+		int e,f,olde=-1,oldf=-1;
+		pair<unsigned int,CPPair> cp;
+		vector< pair<unsigned int,CPPair> > cps;   // cells of the row being read
+		while(infile2>>e>>f){
+			cp.first=f;
+			assert(e>=olde);
+			assert(e>olde ||f>oldf);
+			if( e!=olde&&olde>=0 ){
+				// A new source word starts: store the finished row of olde.
+				int oldsize=lexmat.size();
+				lexmat.resize(olde+1);
+				for(unsigned int i=oldsize;i<lexmat.size();++i)
+					lexmat[i]=0;
+				lexmat[olde]=new vector< pair<unsigned int,CPPair> > (cps);
+				cps.clear();
+				if( !((*lexmat[olde]).size()==(*lexmat[olde]).capacity()) )
+					cerr << "eRROR: waste of memory: " << (*lexmat[olde]).size() << " " << (*lexmat[olde]).capacity() << endl;
+				count2+=lexmat[olde]->capacity();
+			}
+			cps.push_back(cp);
+			olde=e;
+			oldf=f;
+			count++;
+		}
+		// Store the last row.  olde is still -1 when nothing was read; in
+		// that case there is no row to store and lexmat must not be indexed.
+		if( olde>=0 ){
+			lexmat.resize(olde+1);
+			lexmat[olde]=new vector< pair<unsigned int,CPPair> > (cps);
+			count2+=lexmat[olde]->capacity();      
+		}
+		cout << "There are " << count << " " << count2 << " entries in table" << '\n';
+		mutex.resize(lexmat.size());
+		/* Create mutex */
+	}
+
+
+  /*  tmodel(const string&fn)
+    {
+      size_t count=0;
+      {
+	ifstream infile1(fn.c_str());
+	if( !infile1 )
+	  {
+	    cerr << "ERROR: can't read coocurrence file " << fn << '\n';
+	    abort();
+	  }
+	int e,f;
+	while(infile1>>e>>f)
+	  count++;
+      }
+      cout << "There are " << count << " entries in table" << '\n';
+      ifstream infile2(fn.c_str());
+      fs.resize(count);
+      int e,f,olde=-1,oldf=-1;
+      pair<unsigned int,CPPair> cp;
+      count=0;
+      while(infile2>>e>>f)
+	{
+	  assert(e>=olde);
+	  assert(e>olde ||f>oldf);
+	  if( e!=olde )
+	    {
+	      es.resize(e+1);
+	      for(unsigned int i=olde+1;int(i)<=e;++i)
+		es[i]=count;
+	    }
+	  cp.first=f;
+	  assert(count<fs.size());
+	  fs[count]=cp;
+	  //fs.push_back(cp);
+	  olde=e;
+	  oldf=f;
+	  count++;
+	}
+      assert(count==fs.size());
+      es.push_back(fs.size());
+      cout << fs.size() << " " << count << " coocurrences read" << '\n';
+      }*/
+  
+	// Adds inc to the count of cell (e,f) if the cell exists and inc is
+	// non-zero.  Only the increment itself is done under the row's mutex;
+	// the lookup happens before the lock is taken.
+	void incCount(WordIndex e, WordIndex f, COUNT inc) {
+		if( inc ){
+			CPPair *p=find(e,f);
+			if( p ){
+				mutex[e].lock();
+				p->count += inc ;
+				mutex[e].unlock();
+			}
+		}
+	}
+
+	// Probability of cell (e,f), floored at PROB_SMOOTH; PROB_SMOOTH when
+	// the cell does not exist.
+	PROB getProb(WordIndex e, WordIndex f) const{
+		const CPPair *p=find(e,f);
+		if( p )
+			return max(p->prob, PROB_SMOOTH);
+		else
+			return PROB_SMOOTH;
+	}
+	
+	// Count of cell (e,f), or 0 when the cell does not exist.
+	COUNT getCount(WordIndex e, WordIndex f) const
+	{
+		const CPPair *p=find(e,f);
+		if( p )
+			return p->count;
+		else
+			return 0.0;
+	}
+
+  void printProbTable(const char* filename, const Vector<WordEntry>&, const Vector<WordEntry>&,bool actual) const;
+  void printCountTable(const char* filename, const Vector<WordEntry>&, const Vector<WordEntry>&,bool actual) const;
+  void printProbTableInverse(const char *filename, 
+			     const Vector<WordEntry>& evlist, 
+			     const Vector<WordEntry>& fvlist, 
+			     const double eTotal, 
+			     const double fTotal, 
+			     const bool actual = false ) const;
+  void normalizeTable(const vcbList&engl, const vcbList&french, int iter=2);
+  bool readProbTable(const char *filename);
+  bool readSubSampledProbTable(const char* filename, std::set<WordIndex> &e, std::set<WordIndex> &f);
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Vector.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/Vector.h
@ -0,0 +1,423 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/*--
+Vector: checked vector implementation
+
+Franz Josef Och (30/07/99)
+--*/
+#ifndef ARRAY_H_DEFINED
+#define ARRAY_H_DEFINED
+#include "mystl.h"
+#include <algorithm>
+#include <string>
+#include <utility>
+#include <functional>
+#include <cassert>
+
+
+#ifdef NDEBUG
+
+#include <vector>
+#define Vector vector
+/* Prints the vector as "Vector(<size>){  <index>: <element> ; ... }" followed
+   by a newline. */
+template<class T> ostream& operator<<(ostream&o, const Vector<T>&a)
+{
+  o << "Vector(" << a.size() << "){ ";
+  unsigned int k=0;
+  while( k<a.size() )
+    {
+      o << " " << k << ": ";
+      o << a[k] << " ;";
+      ++k;
+    }
+  o << "}\n";
+  return o;
+}
+
+#else
+
+#define ARRAY_DEBUG
+#define memo_del(a, b)
+#define memo_new(a)
+
+/* Bounds-checked growable array used when NDEBUG is not defined.
+   The logical size is maxWritten+1; the allocated capacity is realSize.
+   Element access outside [0,maxWritten] is reported through errorAccess(). */
+template<class T> class Vector
+{
+private:
+	// Heap array holding the elements (null for a default-constructed Vector).
+	T *p;                  	
+	// Number of elements allocated in p.
+	int realSize; 
+	// Index of the last valid element; -1 when the Vector is empty.
+	int maxWritten;
+	
+	// Element-wise copy of n elements from b to a.
+	void copy(T *a, const T *b, int n);
+	void copy(T *a, T *b, int n);
+	// Grows the allocation to 2*realSize+1 elements, keeping the old contents.
+	void _expand();		
+public:
+  // Empty vector without any allocation.
+  Vector() 
+    : p(0), realSize(0), maxWritten(-1)
+    {
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY: " << this<<" "<<(void*)p << '\n';
+#endif
+    }
+  // Copy constructor: allocates exactly x.size() elements and copies them.
+  Vector(const Vector<T> &x)
+    : p(new T[x.maxWritten+1]), realSize(x.maxWritten+1), maxWritten(x.maxWritten)
+    {
+      memo_new(p);
+      copy(p, x.p, realSize);
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY copy: " << this << " " << realSize <<" "<<(void*)p<< '\n';
+#endif
+    }
+  // Vector of n default-constructed elements.
+  explicit Vector(int n)
+    : p(new T[n]), realSize(n), maxWritten(n-1)
+    {
+      memo_new(p);
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY with parameter n: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+    }
+  // Vector of n elements, each assigned _init.
+  Vector(int n, const T&_init)
+    : p(new T[n]), realSize(n), maxWritten(n-1)
+    {
+      memo_new(p);
+      for(int iii=0;iii<n;iii++)p[iii]=_init;
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY with parameter n and init: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+    }
+  
+  // Releases the array and resets the bookkeeping fields.
+  ~Vector() 
+    { 
+#ifdef VERY_ARRAY_DEBUG
+      cout << "FREE ARRAY: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+      delete [] p;
+      memo_del(p, 1);
+#ifndef NDEBUG
+      p=0;realSize=-1;maxWritten=-1;
+#endif
+    }
+  
+  // Copy assignment: frees the old array, then allocates x.size() elements
+  // and copies them.  Self-assignment is a no-op.
+  Vector<T>& operator=(const Vector<T>&x)
+    {
+      if( this!= &x )
+	{
+#ifdef VERY_ARRAY_DEBUG
+	  cout << "FREE ARRAY because of operator=: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif	
+	  delete [] p;
+	  memo_del(p, 1);
+	  realSize = x.maxWritten+1;
+	  maxWritten = x.maxWritten;
+	  p = new T[realSize]; 
+	  memo_new(p);
+	  copy(p, x.p, realSize);
+#ifdef VERY_ARRAY_DEBUG
+	  cout << "NEW ARRAY because of operator=: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+	}
+      return *this;
+    }
+  
+  // Same as the const overload above, for a non-const right-hand side.
+  Vector<T>& operator=(Vector<T>&x)
+    {
+      if( this!= &x )
+	{
+#ifdef VERY_ARRAY_DEBUG
+	  cout << "FREE ARRAY because of operator=: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+	  delete [] p;
+	  memo_del(p, 1);
+	  realSize = x.maxWritten+1;
+	  maxWritten = x.maxWritten;
+	  p = new T[realSize]; 
+	  memo_new(p);
+	  copy(p, x.p, realSize);
+#ifdef VERY_ARRAY_DEBUG
+	  cout << "NEW ARRAY because of operator=: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+	}
+      return *this;
+    }
+  
+  // Makes index n valid: grows the allocation until it holds n and raises
+  // the logical size to at least n+1.
+  void allowAccess(int n) 
+    { 
+      while( realSize<=n )
+	_expand(); 
+      maxWritten=max(maxWritten, n);
+      assert( maxWritten<realSize );
+    }
+  // Sets the logical size to n, growing the allocation if needed.  The
+  // allocation is never shrunk.
+  void resize(int n)
+    {
+      while( realSize<n ) 
+	_expand(); 
+      maxWritten=n-1;
+    }
+  // Sets the logical size to 0; the allocation is kept.
+  void clear()
+    {
+      resize(0);
+    }
+  // Grows the allocation to at least n elements without changing the
+  // logical size.
+  void reserve(int n)
+    {
+      int maxOld=maxWritten;
+      resize(n);
+      maxWritten=maxOld;
+    }
+  // Sorts the first `until` elements ascending (all elements by default).
+  void sort(int until=-1)
+    {
+      if( until== -1 ) until=size();
+      std::sort(p, p+until);
+    }
+  // Sorts the first `until` elements descending (all elements by default).
+  void invsort(int until=-1)
+    {
+      if( until== -1 ) until=size();
+      std::sort(p, p+until, greater<T>());      
+    }
+  // Replaces the contents by n elements, each assigned _init.
+  void init(int n, const T&_init)
+    {
+#ifdef VERY_ARRAY_DEBUG
+      cout << "FREE ARRAY because of init: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+      delete []p;
+      memo_del(p, 1);
+      p=new T[n];
+      memo_new(p);
+      realSize=n;
+      maxWritten=n-1;
+      for(int iii=0;iii<n;iii++)p[iii]=_init;
+#ifdef VERY_ARRAY_DEBUG
+      cout << "NEW ARRAY because of init: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+    }
+  // Logical number of elements.
+  inline unsigned int size() const
+    {assert( maxWritten<realSize );
+    return maxWritten+1;}
+  // Smallest valid index (always 0).
+  inline int low() const
+    { return 0; }
+  // Largest valid index, -1 when empty.
+  inline int high() const
+    { return maxWritten; }
+  // Index of the largest / smallest element, -1 when empty.
+  int findMax() const;
+  int findMin() const;
+  // Reports an out-of-range access to index n and terminates.
+  void errorAccess(int n) const;
+  inline T*getPointerToData(){return p;}
+  inline T*begin(){return p;}
+  inline T*end(){return p+maxWritten+1;}
+  // Checked element access: an index outside [0,maxWritten] goes to
+  // errorAccess().
+  inline T& operator[](int n)
+    { 
+#ifndef NDEBUG
+      if( n<0 || n>maxWritten )
+	errorAccess(n);
+#endif
+      return p[n];
+    }
+  inline const T& operator[](int n) const 
+    { 
+#ifndef NDEBUG
+      if(n<0 || n>maxWritten )
+	errorAccess(n);
+#endif
+      return p[n]; 
+    }
+  inline const T& get(int n) const 
+    { 
+#ifndef NDEBUG
+      if(n<0 || n>maxWritten )
+	errorAccess(n);
+#endif      
+      return p[n]; 
+    }
+  // top(n) and back(n) both return the element n positions before the last
+  // one (n=0 is the last element).
+  const T&top(int n=0) const
+    {return (*this)[maxWritten-n];}
+  T&top(int n=0)
+    {return (*this)[maxWritten-n];}
+  const T&back(int n=0) const
+    {return (*this)[maxWritten-n];}
+  T&back(int n=0)
+    {return (*this)[maxWritten-n];}
+  // Appends x and returns a reference to the new last element.
+  T&push_back(const T&x)
+    {     
+      allowAccess(maxWritten+1);
+      (*this)[maxWritten]=x;
+      return top();
+    }
+  // Writes "Vector <size> " followed by each element (via writeOb) on its
+  // own line.  Always returns true.
+  bool writeTo(ostream&out) const
+    {
+      out << "Vector ";
+      out << size() << " ";
+      //out << a << '\n';
+      for(int iv=0;iv<=maxWritten;iv++)
+	{
+	  writeOb(out, (*this)[iv]);
+	  out << '\n';
+	}
+      return 1;
+    }
+  // Reads the format produced by writeTo(): the word "Vector", the element
+  // count, then each element via readOb.  Returns false when the stream is
+  // bad or the leading word is not "Vector".
+  bool readFrom(istream&in)
+    {
+      string s;
+      if( !in )
+	{
+	  cerr << "ERROR(Vector): file cannot be opened.\n";
+	  return 0;
+	}
+      in >> s;
+      if( !(s=="Vector") )
+	{
+	  cerr << "ERROR(Vector): Vector!='"<<s<<"'\n";
+	  return 0;
+	}
+      int biggest;
+      in >> biggest;
+     // in >> a;
+      resize(biggest);
+      for(int iv=0;iv<size();iv++)
+	{
+	  readOb(in, (*this)[iv]);
+	}
+      return 1;
+    }
+};
+
+/* Two Vectors are equal when they are the same object, or have the same
+   size and compare equal element by element. */
+template<class T> bool operator==(const Vector<T> &x, const Vector<T> &y)
+{
+  if( &x == &y )
+    return 1;
+  const unsigned int len=x.size();
+  if( y.size()!=len )
+    return 0;
+  for(unsigned int k=0;k<len;k++)
+    if( !(x[k]==y[k]) )
+      return 0;
+  return 1;
+}
+/* Negation of operator== for Vectors. */
+template<class T> bool operator!=(const Vector<T> &x, const Vector<T> &y)
+{
+  const bool same=(x==y);
+  return !same;
+}
+
+/* Ordering of Vectors: the first differing element decides; when one Vector
+   is a prefix of the other, the shorter one is the smaller. */
+template<class T> bool operator<(const Vector<T> &x, const Vector<T> &y)
+{
+  if( &x == &y )
+    return 0;
+  // Always walk the shorter operand: swap the roles when y is shorter.
+  if( y.size()<x.size() )
+    return !(y<x);
+  int k=0;
+  while( k<x.size() )
+    {
+      assert( k!=y.size() );
+      if( x[k]<y[k] )
+	return 1;
+      if( y[k]<x[k] )
+	return 0;
+      ++k;
+    }
+  // All of x matched the start of y: x is smaller only if y is longer.
+  return x.size()!=y.size();//??
+}
+
+
+/* Reports an out-of-range access to index n on cerr and then on cout,
+   trips an assertion, and aborts unless DEBUG is defined. */
+template<class T> void Vector<T>:: errorAccess(int n) const
+{
+  ostream* sinks[2]={ &cerr, &cout };
+  for(int s=0;s<2;s++)
+    *sinks[s] << "ERROR: Access to array element " << n 
+	      << " (" << maxWritten << ", " << realSize << ", " << (void*)p << ")\n";
+  assert(0);
+#ifndef DEBUG
+  abort();
+#endif
+}
+
+/* Prints the vector as "Vector(<size>){  <index>: <element> ; ... }" followed
+   by a newline. */
+template<class T> ostream& operator<<(ostream&o, const Vector<T>&a)
+{
+  o << "Vector(" << a.size() << "){ ";
+  unsigned int k=0;
+  while( k<a.size() )
+    {
+      o << " " << k << ": ";
+      o << a[k] << " ;";
+      ++k;
+    }
+  o << "}\n";
+  return o;
+}
+
+/* No-op extraction: nothing is read and the Vector argument is left
+   untouched; the stream is returned unchanged. */
+template<class T> istream& operator>>(istream&in, Vector<T>&)
+{return in;}
+
+/* Hash of a Vector: sum of Hash(element)*(index+1) over all elements, plus
+   47 times the size. */
+template<class T> int Hash(const Vector<T>&a)
+{
+  int acc=0;
+  int k=0;
+  while( k<a.size() )
+    {
+      acc+=Hash(a[k])*(k+1);
+      ++k;
+    }
+  return acc+a.size()*47;
+}
+/* Assigns the first n elements of bb to aa, in ascending index order. */
+template<class T> void Vector<T>::copy(T *aa, const T *bb, int n)
+{
+  int k=0;
+  while( k<n )
+    {
+      aa[k]=bb[k];
+      ++k;
+    }
+}
+/* Assigns the first n elements of bb to aa, in ascending index order
+   (overload for a non-const source). */
+template<class T> void Vector<T>::copy(T *aa, T *bb, int n)
+{
+  int k=0;
+  while( k<n )
+    {
+      aa[k]=bb[k];
+      ++k;
+    }
+}
+
+/* Grows the allocation from realSize to 2*realSize+1 elements: allocates the
+   new array, copies the old contents over and frees the old array.  The
+   logical size (maxWritten) is not changed. */
+template<class T> void Vector<T>::_expand()
+{
+#ifdef VERY_ARRAY_DEBUG
+  cout << "FREE ARRAY because of _expand: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+  T *const previous=p;
+  const int previousSize=realSize;
+  realSize=previousSize*2+1;
+  p=new T[realSize];
+  memo_new(p);
+  copy(p, previous, previousSize);
+  delete [] previous;
+  memo_del(previous, 1);
+#ifdef VERY_ARRAY_DEBUG
+  cout << "NEW ARRAY because of _expand: " << this << " " << realSize<<" "<<(void*)p << '\n';
+#endif			
+}
+
+/* Index of the largest element (the first one among equals), or -1 when the
+   Vector is empty. */
+template<class T> int Vector<T>::findMax() const
+{
+  if( size()==0 )
+    return -1;
+  int best=0;
+  for(int k=1;k<size();k++)
+    if( (*this)[best]<(*this)[k] )
+      best=k;
+  return best;
+}
+/* Index of the smallest element (the first one among equals), or -1 when the
+   Vector is empty. */
+template<class T> int Vector<T>::findMin() const
+{
+  if( size()==0 )
+    return -1;
+  int best=0;
+  for(int k=1;k<size();k++)
+    if( (*this)[k]<(*this)[best] )
+      best=k;
+  return best;
+}
+
+#endif
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/WordClasses.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/WordClasses.h
@ -0,0 +1,103 @@
+/*
+
+Copyright (C) 2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef WordClasses_h_DEFINED
+#define WordClasses_h_DEFINED
+#include <map>
+#include <string>
+#include <set>
+#include "vocab.h"
+
+/* Mapping between words, word-class names and integer class ids.  Class id 0
+   with the name "0" always exists and is the answer for anything unknown. */
+class WordClasses
+{
+ private:
+  map<string,string> Sw2c;    // word -> class name
+  map<string,int> Sc2int;     // class name -> class id
+  Vector<string> Sint2c;      // class id -> class name
+  Vector<int> w2c;            // word id -> class id
+  unsigned int classes;       // number of class ids handed out so far
+ public:
+  WordClasses() 
+    : classes(1) 
+    {
+      Sc2int["0"]=0;
+      Sint2c.push_back("0");
+    }
+  /* Reads "word class" lines from `in`.  Every class name seen gets an id;
+     a word is stored only if vcb.has_word(word) is true, and m(word)
+     supplies its integer id.  Always returns true. */
+  template<class MAPPER> bool read(istream&in,const MAPPER&m,const vcbList& vcb)
+    {
+      int highestId=0;
+      int linesSeen=0, wordsKept=0;
+      string line;
+      while(getline(in,line))
+	{
+	  ++linesSeen;
+	  string word,wclass;
+	  istrstream fields(line.c_str());
+	  fields>>word;
+	  fields>>wclass;
+
+	  // Register the class name the first time it appears.
+	  if( Sc2int.find(wclass)==Sc2int.end() )
+	    {
+	      Sc2int[wclass]=classes;
+	      ++classes;
+	      Sint2c.push_back(wclass);
+	      assert(classes==Sint2c.size());
+	    }
+
+	  if( !vcb.has_word(word) )
+	    continue;
+	  highestId=max(m(word),highestId);
+	  assert(Sw2c.count(word)==0);
+	  Sw2c[word]=wclass;
+	  ++wordsKept;
+	}
+
+      // Build the dense word-id -> class-id table; ids without a class keep 0.
+      w2c=Vector<int>(highestId+1,0);
+      map<string,string>::const_iterator it=Sw2c.begin();
+      while( it!=Sw2c.end() )
+	{
+	  w2c[m(it->first)]=Sc2int[it->second];
+	  ++it;
+	}
+      cout << "Read classes: #words: " << highestId << " " << " #classes: "<< classes <<endl;
+      cout << "Actual number of read words: " << linesSeen << " stored words: " << wordsKept << endl;
+      return 1;
+    }
+  /* Class id of word id w; 0 when w is outside the table. */
+  int getClass(int w)const
+    {
+      const bool inRange = w>=0&&int(w)<int(w2c.size());
+      return inRange ? w2c[w] : 0;
+    }
+  /* Class id for a class name; warns on cerr and returns 0 when unknown. */
+  int operator()(const string&x)const
+    {
+      map<string,int>::const_iterator hit=Sc2int.find(x);
+      if( hit!=Sc2int.end() )
+	return hit->second;
+      cerr << "WARNING:  class " << x << " not found.\n";
+      return 0;
+    }
+  /* Class name for a class id; "0" when the id is out of range. */
+  string classString(unsigned int cnr)const
+    {
+      if( cnr>=Sint2c.size() )
+	return string("0");
+      return Sint2c[cnr];
+    }
+};
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/alignment.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/alignment.cpp
@ -0,0 +1,38 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/*--
+alignment: 'checked' alignment representation with automatic calculation
+           of fertilities
+Franz Josef Och (30/07/99)
+--*/
+#include "alignment.h"
+
+/* Prints the alignment as
+   "AL(l:<l>,m:<m>)(a: a(1) ... a(m) )(fert: fert(0) ... fert(l) )  c:"
+   followed by a newline, where m and l are the sizes of the alignment and
+   fertility vectors minus one. */
+ostream&operator<<(ostream&out, const alignment&a)
+{
+  const int lastTarget=a.a.size()-1;
+  const int lastSource=a.f.size()-1;
+  out << "AL(l:"<<lastSource<<",m:"<<lastTarget<<")(a: ";
+  int j=1;
+  while( j<=lastTarget )
+    {
+      out << a(j) << ' ';
+      ++j;
+    }
+  out << ")(fert: ";
+  int i=0;
+  while( i<=lastSource )
+    {
+      out << a.fert(i) << ' ';
+      ++i;
+    }
+  out << ")  c:"<<"\n";
+  return out;
+}
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/alignment.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/alignment.h
@ -0,0 +1,227 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/*--
+alignment: 'checked' alignment representation with autom. calc. of fertilities
+Franz Josef Och (30/07/99)
+--*/
+#ifndef alignment_h_fjo_defined
+#define alignment_h_fjo_defined
+#include "Vector.h"
+#include <cassert>
+#include "defs.h"
+#include "myassert.h"
+
+/* Link node holding a previous and a next position; both start at 0. */
+class al_struct
+{
+ public:
+  PositionIndex prev;
+  PositionIndex next;
+  al_struct()
+    : prev(0), next(0)
+    {}
+};
+
+
+/* Alignment of target positions 1..m to source positions 0..l, with
+   incrementally maintained fertilities, position sums and, per source
+   position, a linked list of the target positions aligned to it. */
+class alignment
+{
+ private:
+  // a[j]: source position that target position j is aligned to.
+  Vector<PositionIndex> a;
+  // positionSum[i]: sum of all j with a[j]==i; f[i]: number of such j.
+  Vector<PositionIndex> positionSum,f;
+ public:
+  // als_i[i]: first target position in the list of source position i (0 = none).
+  Vector<PositionIndex> als_i;
+  // als_j[j]: previous/next target position in the list that j belongs to
+  // (0 = none).
+  Vector<al_struct>  als_j;
+  PositionIndex l,m;
+  // NOTE: leaves l and m uninitialised.
+  alignment()
+    {}
+  // Starts with every target position aligned to source position 0:
+  // f[0]=m and the list of position 0 is 1,2,...,m.
+  alignment(PositionIndex _l, PositionIndex _m)
+    : a(_m+1, (PositionIndex)0),
+    positionSum(_l+1, (PositionIndex)0), f(_l+1, (PositionIndex)0), als_i(_l+1,0),als_j(_m+1),l(_l), m(_m)
+    {
+      f[0]=m;
+      for(PositionIndex j=1;j<=m;j++)
+	{
+	  if( j>1 )
+	    als_j[j].prev= j-1;
+	  if( j<m )
+	    als_j[j].next= j+1;
+	}
+      als_i[0]=1;
+    }
+  PositionIndex get_l()const
+    {return l;}
+  PositionIndex get_m()const
+    {return m;}
+  // Aligns target position j to source position i.
+  void doMove(int i,int j)
+    {
+      set(j,i);
+    }
+  // Exchanges the source positions of target positions j1 and j2.
+  void doSwap(int j1,int j2)
+    {
+      int aj1=a[j1],aj2=a[j2];
+      set(j1,aj2);
+      set(j2,aj1);
+    }
+  // Re-aligns target position j to source position aj and updates the
+  // fertilities, position sums and linked lists accordingly.
+  void set(PositionIndex j, PositionIndex aj)
+    {
+      PositionIndex old_aj=a[j];
+      massert(j<a.size());massert(aj<f.size());
+      massert(old_aj<f.size());massert(f[old_aj]>0);
+      massert(j>0);
+      positionSum[old_aj]-=j;
+      // unlink j from the list of its old source position
+      PositionIndex prev=als_j[j].prev;
+      PositionIndex next=als_j[j].next;
+      if( next )
+	als_j[next].prev=prev;
+      if( prev )
+	als_j[prev].next=next;
+      else
+	als_i[old_aj]=next;
+      
+      // find the insertion point in the list of aj: lfd becomes the first
+      // entry that is not smaller than j, llfd the entry before it
+      PositionIndex lfd=als_i[aj],llfd=0;
+      while( lfd && lfd<j )
+	lfd = als_j[llfd=lfd].next;
+
+      // link j in between llfd and lfd
+      als_j[j].prev=llfd;
+      als_j[j].next=lfd;
+      if( llfd )
+	als_j[llfd].next=j;
+      else
+	als_i[aj]=j;
+      if( lfd )
+	als_j[lfd].prev=j;
+
+      f[old_aj]--;
+      positionSum[aj]+=j;
+      f[aj]++;
+      a[j]=aj;
+    }
+  const Vector<PositionIndex>& getAlignment() const 
+    {return a ;}
+  // Source position aligned to target position j (same as operator()).
+  PositionIndex get_al(PositionIndex j)const
+    {
+      massert(j<a.size());
+      return a[j];
+    }
+  PositionIndex operator()(PositionIndex j)const
+    {
+      massert(j<a.size());
+      return a[j];
+    }
+  // Fertility of source position i.
+  PositionIndex fert(PositionIndex i)const
+    {
+      massert(i<f.size());
+      return f[i];
+    }
+  // First target position aligned to i, 0 if there is none.
+  PositionIndex get_head(PositionIndex i)const
+    {
+      massert( als_i[i]==_get_head(i) );
+      return als_i[i];
+    }
+  // Average target position aligned to i, rounded up; 0 for i==0.
+  PositionIndex get_center(PositionIndex i)const
+    {
+      if( i==0 )return 0;
+      massert(((positionSum[i]+f[i]-1)/f[i]==_get_center(i)));
+      return (positionSum[i]+f[i]-1)/f[i];
+    }
+  // Reference implementation of get_head() that scans a[] directly.
+  PositionIndex _get_head(PositionIndex i)const
+    {
+      if( fert(i)==0 )return 0;
+      for(PositionIndex j=1;j<=m;j++)
+	if( a[j]==i )
+	  return j;
+      return 0;
+    }
+  // Reference implementation of get_center() that scans a[] directly.
+  PositionIndex _get_center(PositionIndex i)const
+    {
+      if( i==0 )return 0;
+      massert(fert(i));
+      PositionIndex sum=0;
+      for(PositionIndex j=1;j<=m;j++)
+	if( a[j]==i )
+	  sum+=j;
+      return (sum+fert(i)-1)/fert(i);
+    }
+  // Closest source position below i with non-zero fertility, 0 if none.
+  PositionIndex prev_cept(PositionIndex i)const
+    {
+      if( i==0 )return 0;
+      PositionIndex k=i-1;
+      while(k&&fert(k)==0)
+	k--;
+      return k;
+    }
+  // Closest source position above i with non-zero fertility, l+1 if none.
+  PositionIndex next_cept(PositionIndex i)const
+    {
+      PositionIndex k=i+1;
+      while(k<l+1&&fert(k)==0)
+	k++;
+      return k;
+    }
+  // Previous target position aligned to the same source position as j,
+  // 0 if j is the first one.
+  PositionIndex prev_in_cept(PositionIndex j)const
+    {
+      //PositionIndex k=j-1;
+      //while(k&&a[k]!=a[j])
+      //k--;
+      //assert( als_j[j].prev==k );
+      //assert(k);
+      //return k;
+      massert(als_j[j].prev==0||a[als_j[j].prev]==a[j]);
+      return als_j[j].prev;
+    }
+  friend ostream &operator<<(ostream&out, const alignment&a);
+  // Equal when a(j) agrees for every j in 1..m.
+  friend bool operator==(const alignment&a, const alignment&b)
+    {
+      massert(a.a.size()==b.a.size());
+      for(PositionIndex j=1;j<=a.get_m();j++)
+	if(a(j)!=b(j))
+	  return 0;
+      return 1;
+    }
+  // Lexicographic comparison of a(1),...,a(m).
+  friend bool operator<(const alignment&x, const alignment&y)
+    {
+      massert(x.get_m()==y.get_m());
+      for(PositionIndex j=1;j<=x.get_m();j++)
+	if( x(j)<y(j) ) 
+	  return 1;
+	else if( y(j)<x(j) )
+	  return 0;
+      return 0;
+    }
+  // Number of target positions whose alignment differs between x and y.
+  friend int differences(const alignment&x, const alignment&y){
+    int count=0;
+    massert(x.get_m()==y.get_m());
+    for(PositionIndex j=1;j<=x.get_m();j++)
+      count += (x(j)!=y(j));
+    return count;
+  }
+  // False when more than half of the target positions are aligned to
+  // source position 0, or when any other source position has a fertility
+  // of MAX_FERTILITY or more.
+  bool valid()const
+    {
+      if( 2*f[0]>m )
+	return 0;
+      for(unsigned int i=1;i<=l;i++)
+	if( f[i]>=MAX_FERTILITY )
+	  return 0;
+      return 1;
+    }
+  friend class transpair_model5;
+};
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/cmd.c
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/cmd.c
@ -0,0 +1,649 @@
+
+// $Id: cmd.c 1307 2007-03-14 22:22:36Z hieuhoang1972 $
+
+#include	<stdio.h>
+#include	<stdlib.h>
+#include	<ctype.h>
+#include	<string.h>
+
+#include	"cmd.h"
+
+#ifdef WIN32
+#		define popen	_popen
+#		define pclose _pclose
+#endif
+
+/* Name/value table backing CMDBOOLTYPE parameters: DeclareParams() registers
+ * such a parameter as a CMDENUMTYPE over these entries.  The record with a
+ * null name terminates the list. */
+static Enum_T	BoolEnum[] = {
+	{	"FALSE",	0	},
+	{	"TRUE",		1	},
+	{	0,		0	}
+};
+
+#ifdef	NEEDSTRDUP
+char	*strdup();
+#endif
+
+#define	FALSE	0
+#define	TRUE	1
+
+#define	LINSIZ		10240
+#define	MAXPARAM	256
+
+/* Forward declarations of the file-local helpers (old-style, without
+ * parameter lists, matching the K&R definitions below). */
+static char	*GetLine(),
+		**str2array();
+static int	Scan(),
+		SetParam(),
+		SetEnum(),
+		SetSubrange(),
+		SetStrArray(),
+		SetGte(),
+		SetLte(),
+		CmdError(),
+		EnumError(),
+		SubrangeError(),
+		GteError(),
+		LteError(),
+		PrintParam(),
+		PrintEnum(),
+		PrintStrArray();
+
+/* Parameter table.  DeclareParams() keeps it ordered by Name (strcmp order)
+ * and terminates it with an entry whose Name is NULL; Scan() relies on that
+ * ordering when it searches. */
+static Cmd_T	cmds[MAXPARAM+1];
+/* Default token separators for command lines and string arrays. */
+static char	*SepString = " \t\n";
+
+/*
+ * DeclareParams() -- register command parameters.
+ *
+ * The argument list is a sequence of groups terminated by a null name:
+ *	name, type, pointer-to-value [, type-specific extras]
+ * Extras by type:
+ *	CMDENUMTYPE		pointer to an Enum_T table
+ *	CMDSUBRANGETYPE		two ints: lower and upper bound
+ *	CMDGTETYPE/CMDLTETYPE	one int: the bound
+ *	CMDSTRARRAYTYPE		separator string (may be null)
+ *	all others		none
+ * Entries are inserted into cmds[] in strcmp() order of their names.  A name
+ * that is already present only produces a warning; the new entry is still
+ * inserted.  At most MAXPARAM entries are stored.  An unknown type code or
+ * an allocation failure terminates the program.  Always returns 0.
+ */
+#if defined(__STDC__)
+#include	<stdarg.h>
+int DeclareParams(char *ParName, ...)
+#else
+#include	<varargs.h>
+int DeclareParams(ParName, va_alist)
+char	*ParName;
+va_dcl
+#endif
+{
+	va_list		args;
+	static int	ParamN = 0;	/* entries currently stored in cmds[] */
+	int		j,
+			c;
+	char		*s;
+
+#if defined(__STDC__)
+	va_start(args, ParName);
+#else
+	va_start(args);
+#endif
+	for(;ParName;) {
+		if(ParamN==MAXPARAM) {
+			fprintf(stderr, "Too many parameters !!\n");
+			break;
+		}
+		/* find the insertion point that keeps the table sorted */
+		for(j=0,c=1; j<ParamN&&(c=strcmp(cmds[j].Name,ParName))<0; j++)
+			;
+		if(!c) {
+			fprintf(stderr,
+				"Warning: parameter \"%s\" declared twice.\n",
+				ParName);
+		}
+		for(c=ParamN; c>j; c--) {
+			cmds[c] = cmds[c-1];
+		}
+		cmds[j].Name = ParName;
+		/* The slot still holds a copy of the entry that was just
+		   shifted up; clear the fields that are not overwritten
+		   unconditionally so the new parameter does not inherit
+		   another parameter's argument string or extra data. */
+		cmds[j].ArgStr = NULL;
+		cmds[j].p = NULL;
+		cmds[j].Type = va_arg(args, int);
+		cmds[j].Val = va_arg(args, void *);
+		switch(cmds[j].Type) {
+		case CMDENUMTYPE:	/* get the pointer to Enum_T struct  */
+			cmds[j].p = va_arg(args, void *);
+			break;
+		case CMDSUBRANGETYPE:	/* get the two extremes		     */
+			cmds[j].p = (void*) calloc(2, sizeof(int));
+			if(!cmds[j].p) {
+				fprintf(stderr,
+					"DeclareParams(): out of memory\n");
+				exit(1);
+			}
+			((int*)cmds[j].p)[0] = va_arg(args, int);
+			((int*)cmds[j].p)[1] = va_arg(args, int);
+			break;
+		case CMDGTETYPE:	/* get lower or upper bound	     */
+		case CMDLTETYPE:
+			cmds[j].p = (void*) calloc(1, sizeof(int));
+			if(!cmds[j].p) {
+				fprintf(stderr,
+					"DeclareParams(): out of memory\n");
+				exit(1);
+			}
+			((int*)cmds[j].p)[0] = va_arg(args, int);
+			break;
+		case CMDSTRARRAYTYPE:	/* get the separators string	     */
+			s = va_arg(args, char*);
+			if(s) {
+				cmds[j].p = (void*)strdup(s);
+				if(!cmds[j].p) {
+					fprintf(stderr,
+						"DeclareParams(): out of memory\n");
+					exit(1);
+				}
+			}
+			break;
+		case CMDBOOLTYPE:	/* booleans are enums over BoolEnum  */
+			cmds[j].Type = CMDENUMTYPE;
+			cmds[j].p = BoolEnum;
+			break;
+		case CMDDOUBLETYPE:	/* nothing else is needed	     */
+		case CMDINTTYPE:
+		case CMDSTRINGTYPE:
+			break;
+		default:
+			fprintf(stderr, "%s: %s %d %s \"%s\"\n",
+				"DeclareParam()", "Unknown Type",
+				cmds[j].Type, "for parameter", cmds[j].Name);
+			exit(1);
+		}
+		ParamN++;
+		ParName = va_arg(args, char *);
+	}
+	cmds[ParamN].Name = NULL;	/* table terminator */
+	va_end(args);
+	return 0;
+}
+
+/*
+ * GetParams() -- read parameter values from command files and from argv.
+ *
+ * n, a		in/out: address of argc and argv.  On return they describe
+ *		the arguments that were not consumed here.
+ * CmdFileName	command file to read first, or NULL for none.
+ *
+ * A leading argument of the form "-=file" names a command file (overriding
+ * CmdFileName).  A file name starting with "@@" is run through popen(), the
+ * name "-" means stdin.  Command files are read line by line until end of
+ * file or a line consisting of "\End".  Afterwards every leading argument of
+ * the form "-name=value" is applied.  Unknown options and unreadable command
+ * files terminate the program.  Always returns 0.
+ */
+int GetParams(n, a, CmdFileName)
+int	*n;
+char	***a;
+char	*CmdFileName;
+{
+	char	*Line,
+		*ProgName;
+	int	argc = *n;
+	char	**argv = *a,
+		*s;
+	FILE	*fp;
+	int	IsPipe;
+	size_t	LineSize = LINSIZ,	/* current capacity of Line */
+		need;
+
+#ifdef	MSDOS
+#define	PATHSEP '\\'
+	char	*dot = NULL;
+#else
+#define	PATHSEP '/'
+#endif
+
+	if(!(Line=malloc(LINSIZ))) {
+		fprintf(stderr, "GetParams(): Unable to alloc %d bytes\n",
+			LINSIZ);
+		exit(1);
+	}
+	/* program name = last path component of argv[0] */
+	if((ProgName=strrchr(*argv, PATHSEP))) {
+		++ProgName;
+	} else {
+		ProgName = *argv;
+	}
+#ifdef	MSDOS
+	if(dot=strchr(ProgName, '.')) *dot = 0;
+#endif
+	--argc;
+	++argv;
+	for(;;) {
+		if(argc && argv[0][0]=='-' && argv[0][1]=='=') {
+			CmdFileName = argv[0]+2;
+			++argv;
+			--argc;
+		}
+		if(!CmdFileName) {
+			break;
+		}
+		IsPipe = !strncmp(CmdFileName, "@@", 2);
+		fp = IsPipe
+		     ? popen(CmdFileName+2, "r")
+		     : strcmp(CmdFileName, "-")
+		       ? fopen(CmdFileName, "r")
+		       : stdin;
+		if(!fp) {
+			fprintf(stderr, "Unable to open command file %s\n",
+				CmdFileName);
+			exit(1);
+		}
+		while(GetLine(fp, LINSIZ, Line) && strcmp(Line, "\\End")) {
+			if(Scan(ProgName, cmds, Line)) {
+				CmdError(Line);
+			}
+		}
+		if(fp!=stdin) {
+			if(IsPipe) pclose(fp); else fclose(fp);
+		}
+		CmdFileName = NULL;
+	}
+	while(argc && **argv=='-' && (s=strchr(*argv, '='))) {
+		/* "prog/name value" plus terminator; grow the buffer when
+		   the argument does not fit instead of overflowing it */
+		need = strlen(ProgName)+strlen(*argv+1)+2;
+		if(need > LineSize) {
+			char	*bigger = realloc(Line, need);
+
+			if(!bigger) {
+				fprintf(stderr,
+					"GetParams(): Unable to alloc %lu bytes\n",
+					(unsigned long)need);
+				exit(1);
+			}
+			Line = bigger;
+			LineSize = need;
+		}
+		/* temporarily turn "-name=value" into "name value" */
+		*s = ' ';
+		sprintf(Line, "%s/%s", ProgName, *argv+1);
+		*s = '=';
+		if(Scan(ProgName, cmds, Line)) CmdError(*argv);
+		--argc;
+		++argv;
+	}
+	*n = argc;
+	*a = argv;
+#ifdef MSDOS
+	if(dot) *dot = '.';
+#endif
+	free(Line);
+	return 0;
+}
+
+/*
+ * PrintParams() -- list every declared parameter on fp, one per line.
+ * With a non-zero ValFlag the current values are printed as well.
+ * Always returns 0.
+ */
+int PrintParams(ValFlag, fp)
+int	ValFlag;
+FILE	*fp;
+{
+	Cmd_T	*cmd;
+
+	fflush(fp);
+	fprintf(fp, "%s", ValFlag ? "Parameters Values:\n" : "Parameters:\n");
+	for(cmd=cmds; cmd->Name; cmd++) {
+		PrintParam(cmd, ValFlag, fp);
+	}
+	fprintf(fp, "\n");
+	fflush(fp);
+	return 0;
+}
+
+/*
+ * SPrintParams() -- build an array of "<pfx><name>=<argument>" strings, one
+ * for every parameter that has an argument string recorded.  The array is
+ * stored in *a; the array and its strings are heap allocated.  A null pfx
+ * is treated as the empty string.  Returns the number of strings.
+ */
+int SPrintParams(a, pfx)
+char	***a,
+	*pfx;
+{
+	int	plen,
+		count = 0,
+		idx = 0;
+	Cmd_T	*cmd;
+
+	if(!pfx) pfx="";
+	plen = strlen(pfx);
+	for(cmd=cmds; cmd->Name; cmd++) {
+		if(cmd->ArgStr) count++;
+	}
+	a[0] = calloc(count, sizeof(char*));
+	for(cmd=cmds; cmd->Name; cmd++) {
+		if(cmd->ArgStr) {
+			/* +2: the '=' and the terminating NUL */
+			a[0][idx] = malloc(strlen(cmd->Name)+strlen(cmd->ArgStr)+plen+2);
+			sprintf(a[0][idx], "%s%s=%s", pfx, cmd->Name, cmd->ArgStr);
+			idx++;
+		}
+	}
+	return idx;
+}
+
+/*
+ * CmdError() -- report an invalid option, list the known parameters on
+ * stderr and terminate the program with a failure status.  Does not return.
+ */
+static int CmdError(opt)
+char	*opt;
+{
+	fprintf(stderr, "Invalid option \"%s\"\n", opt);
+	fprintf(stderr, "This program expects the following parameters:\n");
+	PrintParams(FALSE, stderr);
+	/* an invalid option is an error: do not report success to the caller */
+	exit(1);
+}
+
+/*
+ * PrintParam() -- print one parameter, indented by four blanks.  The name is
+ * always printed; the value only when ValFlag is non-zero.  Enum and string
+ * array parameters are delegated to their own printers.  An unknown type
+ * code terminates the program.  Returns 0.
+ */
+static int PrintParam(cmd, ValFlag, fp)
+Cmd_T	*cmd;
+int	ValFlag;
+FILE	*fp;
+{
+	char	*str;
+
+	fprintf(fp, "%4s", "");
+	switch(cmd->Type) {
+	case CMDENUMTYPE:
+		PrintEnum(cmd, ValFlag, fp);
+		return 0;
+	case CMDSTRARRAYTYPE:
+		PrintStrArray(cmd, ValFlag, fp);
+		return 0;
+	case CMDDOUBLETYPE:
+		fprintf(fp, "%s", cmd->Name);
+		if(ValFlag) {
+			fprintf(fp, ": %22.15e", *(double *)cmd->Val);
+		}
+		break;
+	case CMDINTTYPE:
+	case CMDSUBRANGETYPE:
+	case CMDGTETYPE:
+	case CMDLTETYPE:
+		fprintf(fp, "%s", cmd->Name);
+		if(ValFlag) {
+			fprintf(fp, ": %d", *(int *)cmd->Val);
+		}
+		break;
+	case CMDSTRINGTYPE:
+		fprintf(fp, "%s", cmd->Name);
+		if(ValFlag) {
+			str = *(char **)cmd->Val;
+			if(str) {
+				fprintf(fp, ": \"%s\"", str);
+			} else {
+				fprintf(fp, ": %s", "NULL");
+			}
+		}
+		break;
+	default:
+		fprintf(stderr, "%s: %s %d %s \"%s\"\n",
+			"PrintParam",
+			"Unknown Type",
+			cmd->Type,
+			"for parameter",
+			cmd->Name);
+		exit(1);
+	}
+	/* the scalar cases share the line terminator */
+	fprintf(fp, "\n");
+	return 0;
+}
+
+/*
+ * GetLine() -- read one logical line from fp into Line (capacity n bytes).
+ *
+ * Lines starting with '#' and lines that are empty after removing leading
+ * white space are skipped.  Leading white space is removed.  A line ending
+ * in a backslash is joined with the following line, the backslash being
+ * replaced by a blank.  Returns Line, or NULL at end of file / read error.
+ */
+static char *GetLine(fp, n, Line)
+FILE	*fp;
+int	n;
+char	*Line;
+{
+	int	j,
+		l,
+		offs=0;
+
+	for(;;) {
+		/* Buffer exhausted by continuation lines: fgets() could
+		   not store anything more, so hand back what we have
+		   instead of looping forever. */
+		if(n-offs < 2) break;
+		if(!fgets(Line+offs, n-offs, fp)) {
+			return NULL;
+		}
+		if(Line[offs]=='#') continue;
+		l = strlen(Line+offs);
+		/* Strip the line terminator only when there is one: the
+		   last line of a file, or a line longer than the buffer,
+		   does not end in '\n' and must keep its last character. */
+		if(l>0 && Line[offs+l-1]=='\n') {
+			Line[offs+--l] = 0;
+		}
+		/* isspace() needs an unsigned char value */
+		for(j=offs; Line[j] && isspace((unsigned char)Line[j]); j++, l--)
+			;
+		if(l<1) continue;
+		if(j > offs) {
+			/* shift the text left over the leading white space */
+			char	*s = Line+offs,
+				*q = Line+j;
+
+			while((*s++=*q++))
+				;
+		}
+		if(Line[offs+l-1]=='\\') {
+			/* continuation: append the next line after a blank */
+			offs += l;
+			Line[offs-1] = ' ';
+		} else {
+			break;
+		}
+	}
+	return Line;
+}
+
+/*
+ * Scan() -- interpret one line of the form "[prog/]name value".
+ *
+ * A line qualified with another program's name is ignored.  When the
+ * parameter name is found in cmds its value is set through SetParam().
+ * Returns non-zero only for a line that is qualified with this program's
+ * name but names an unknown parameter; otherwise the SetParam() result or 0.
+ */
+static int Scan(ProgName, cmds, Line)
+char	*ProgName,
+	*Line;
+Cmd_T	*cmds;
+{
+	char	*slash,
+		*key,
+		saved;
+	int	idx,
+		keylen,
+		qualified = FALSE,
+		cmp = 1;
+
+	key = Line+strspn(Line, SepString);
+	keylen = strcspn(key, SepString);
+	if(keylen==0) {
+		return 0;
+	}
+	slash = strchr(key, '/');
+	if(slash && slash-key<keylen) {
+		/* the part before the slash must be exactly ProgName */
+		if(strncmp(key, ProgName, (size_t)(slash-key))
+		   || ProgName[slash-key]) {
+			return 0;
+		}
+		qualified = TRUE;
+		key = slash+1;
+	}
+	keylen = strcspn(key, SepString);
+	if(keylen==0) {
+		return 0;
+	}
+	/* terminate the name in place for the comparison, then restore */
+	saved = key[keylen];
+	key[keylen] = 0;
+	idx = 0;
+	while(cmds[idx].Name && (cmp=strcmp(cmds[idx].Name, key))<0) {
+		idx++;
+	}
+	key[keylen] = saved;
+	if(cmp==0) {
+		return SetParam(cmds+idx,
+				key+keylen+strspn(key+keylen, SepString));
+	}
+	return qualified;
+}
+
+/*
+ * SetParam() -- store the value given by the text s in parameter cmd.
+ *
+ * An empty s is accepted only for string parameters; for every other type a
+ * warning is printed and nothing is changed.  For string parameters the
+ * texts "<NULL>" and "NULL" store a null pointer.  Malformed numbers and an
+ * unknown type code terminate the program.  On success a copy of s is
+ * recorded in cmd->ArgStr.  Returns 0.
+ */
+static int SetParam(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	if(cmd->Type != CMDSTRINGTYPE && !*s) {
+		fprintf(stderr,
+			"WARNING: No value specified for parameter \"%s\"\n",
+			cmd->Name);
+		return 0;
+	}
+	switch(cmd->Type) {
+	case CMDENUMTYPE:
+		SetEnum(cmd, s);
+		break;
+	case CMDSTRARRAYTYPE:
+		SetStrArray(cmd, s);
+		break;
+	case CMDSUBRANGETYPE:
+		SetSubrange(cmd, s);
+		break;
+	case CMDGTETYPE:
+		SetGte(cmd, s);
+		break;
+	case CMDLTETYPE:
+		SetLte(cmd, s);
+		break;
+	case CMDSTRINGTYPE:
+		if(!strcmp(s, "<NULL>") || !strcmp(s, "NULL")) {
+			*(char **)cmd->Val = 0;
+		} else {
+			*(char **)cmd->Val = strdup(s);
+		}
+		break;
+	case CMDINTTYPE:
+		if(sscanf(s, "%d", (int*)cmd->Val)!=1) {
+			fprintf(stderr,
+				"Integer value required for parameter \"%s\"\n",
+				cmd->Name);
+			exit(1);
+		}
+		break;
+	case CMDDOUBLETYPE:
+		if(sscanf(s, "%lf", (double*)cmd->Val)!=1) {
+			fprintf(stderr,
+				"Float value required for parameter \"%s\"\n",
+				cmd->Name);
+			exit(1);
+		}
+		break;
+	default:
+		fprintf(stderr, "%s: %s %d %s \"%s\"\n",
+			"SetParam",
+			"Unknown Type",
+			cmd->Type,
+			"for parameter",
+			cmd->Name);
+		exit(1);
+	}
+	/* remember the raw text; SPrintParams() reports it */
+	cmd->ArgStr = strdup(s);
+	return 0;
+}
+
+/*
+ * SetEnum() -- look s up in the parameter's Enum_T table and store the
+ * matching index.  Entries with an empty name never match.  An unknown
+ * name is reported through EnumError().
+ */
+static int SetEnum(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	Enum_T	*entry = (Enum_T *)cmd->p;
+
+	while(entry->Name) {
+		if(*entry->Name && strcmp(s, entry->Name)==0) {
+			*(int *) cmd->Val = entry->Idx;
+			return 0;
+		}
+		entry++;
+	}
+	return EnumError(cmd, s);
+}
+
+/*
+ * SetSubrange() -- parse an integer from s and store it if it lies within
+ * the two bounds kept in cmd->p (inclusive).  A malformed number terminates
+ * the program; a value out of range is reported through SubrangeError().
+ */
+static int SetSubrange(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	int	value,
+		*bounds = (int *)cmd->p;
+
+	if(sscanf(s, "%d", &value)!=1) {
+		fprintf(stderr,
+			"Integer value required for parameter \"%s\"\n",
+			cmd->Name);
+		exit(1);
+	}
+	if(value < bounds[0] || value > bounds[1]) {
+		return SubrangeError(cmd, value);
+	}
+	*(int *)cmd->Val = value;
+	return 0;
+}
+
+/*
+ * SetGte() -- parse an integer from s and store it if it is not below the
+ * lower bound kept in cmd->p.  A malformed number terminates the program;
+ * a value that is too small is reported through GteError().
+ */
+static int SetGte(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	int	value;
+
+	if(sscanf(s, "%d", &value)!=1) {
+		fprintf(stderr,
+			"Integer value required for parameter \"%s\"\n",
+			cmd->Name);
+		exit(1);
+	}
+	if(value >= *(int *)cmd->p) {
+		*(int *)cmd->Val = value;
+		return 0;
+	}
+	return GteError(cmd, value);
+}
+
+/*
+ * SetStrArray() -- split s with the parameter's separator string (cmd->p)
+ * and store the resulting array in the caller's variable.  Returns 0.
+ */
+static int SetStrArray(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	char	**list = str2array(s, (char*)cmd->p);
+
+	*(char***)cmd->Val = list;
+	return 0;
+}
+
+/*
+ * SetLte() -- parse an integer from s and store it if it does not exceed
+ * the upper bound kept in cmd->p.  A malformed number terminates the
+ * program; a value that is too large is reported through LteError().
+ */
+static int SetLte(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	int	value;
+
+	if(sscanf(s, "%d", &value)!=1) {
+		fprintf(stderr,
+			"Integer value required for parameter \"%s\"\n",
+			cmd->Name);
+		exit(1);
+	}
+	if(value <= *(int *)cmd->p) {
+		*(int *)cmd->Val = value;
+		return 0;
+	}
+	return LteError(cmd, value);
+}
+
+/*
+ * EnumError() -- report an invalid enum value together with the list of
+ * accepted names (entries with an empty name are not listed) and terminate
+ * the program.  Does not return.
+ */
+static int EnumError(cmd, s)
+Cmd_T	*cmd;
+char	*s;
+{
+	Enum_T	*entry;
+
+	fprintf(stderr,
+		"Invalid value \"%s\" for parameter \"%s\"\n", s, cmd->Name);
+	fprintf(stderr, "Valid values are:\n");
+	entry = (Enum_T *)cmd->p;
+	while(entry->Name) {
+		if(*entry->Name) {
+			fprintf(stderr, "    %s\n", entry->Name);
+		}
+		entry++;
+	}
+	fprintf(stderr, "\n");
+	exit(1);
+}
+
+/*
+ * GteError() -- report a value below the parameter's lower bound and
+ * terminate the program.  Does not return.
+ */
+static int GteError(cmd, n)
+Cmd_T	*cmd;
+int	n;
+{
+	int	lowest;
+
+	fprintf(stderr,
+		"Value %d out of range for parameter \"%s\"\n", n, cmd->Name);
+	lowest = *(int *)cmd->p;
+	fprintf(stderr, "Valid values must be greater than or equal to  %d\n",
+		lowest);
+	exit(1);
+}
+
+/*
+ * LteError() -- report a value above the parameter's upper bound and
+ * terminate the program.  Does not return.
+ */
+static int LteError(cmd, n)
+Cmd_T	*cmd;
+int	n;
+{
+	int	highest;
+
+	fprintf(stderr,
+		"Value %d out of range for parameter \"%s\"\n", n, cmd->Name);
+	highest = *(int *)cmd->p;
+	fprintf(stderr, "Valid values must be less than or equal to  %d\n",
+		highest);
+	exit(1);
+}
+
+/*
+ * SubrangeError() -- report a value outside the parameter's range and
+ * terminate the program.  Does not return.
+ */
+static int SubrangeError(cmd, n)
+Cmd_T	*cmd;
+int	n;
+{
+	int	*bounds;
+
+	fprintf(stderr,
+		"Value %d out of range for parameter \"%s\"\n", n, cmd->Name);
+	bounds = (int *)cmd->p;
+	fprintf(stderr, "Valid values range from %d to %d\n",
+		bounds[0], bounds[1]);
+	exit(1);
+}
+
+/*
+ * PrintEnum() -- print the name of an enum parameter and, when ValFlag is
+ * non-zero, the name of every table entry whose index equals the current
+ * value (entries with an empty name are skipped).  Returns 0.
+ */
+static int PrintEnum(cmd, ValFlag, fp)
+Cmd_T	*cmd;
+int	ValFlag;
+FILE	*fp;
+{
+	Enum_T	*entry;
+
+	fprintf(fp, "%s", cmd->Name);
+	if(!ValFlag) {
+		fprintf(fp, "\n");
+		return 0;
+	}
+	entry = (Enum_T *)cmd->p;
+	while(entry->Name) {
+		if(*entry->Name && entry->Idx==*(int *)cmd->Val) {
+			fprintf(fp, ": %s", entry->Name);
+		}
+		entry++;
+	}
+	fprintf(fp, "\n");
+	return 0;
+}
+
+/*
+ * PrintStrArray() -- print the name of a string array parameter and, when
+ * ValFlag is non-zero, its elements: the first one after ": ", the others
+ * on lines of their own, indented so that they line up with the first.
+ * A null array prints nothing after ": ", an empty array prints "NULL".
+ * Returns 0.
+ */
+static int PrintStrArray(cmd, ValFlag, fp)
+Cmd_T	*cmd;
+int	ValFlag;
+FILE	*fp;
+{
+	char	**s = *(char***)cmd->Val;
+	/* 4 blanks of PrintParam() indentation + the name + 1 */
+	int	pad = 4+strlen(cmd->Name)+1;
+
+	fprintf(fp, "%s", cmd->Name);
+	if(ValFlag) {
+		fprintf(fp, ": %s", s ? (*s ? *s++ : "NULL") : "");
+		if(s) while(*s) {
+			/* "%*s" with an empty string emits pad blanks, so no
+			   scratch buffer (and no unchecked malloc) is needed */
+			fprintf(fp, "\n%*s %s", pad, "", *s++);
+		}
+	}
+	fprintf(fp, "\n");
+	return 0;
+}
+
+/*
+ * str2array() -- split s into tokens separated by any character of sep
+ * (SepString when sep is null).  Returns a heap allocated, null terminated
+ * array of heap allocated copies of the tokens.  An allocation failure
+ * terminates the program.
+ */
+static char **str2array(s, sep)
+char	*s,
+	*sep;
+{
+	char	*p,
+		**a;
+	int	n = 0,
+		l;
+
+	if(!sep) sep = SepString;
+	p = s += strspn(s, sep);
+	/* first pass: count the tokens */
+	while(*p) {
+		p += strcspn(p, sep);
+		p += strspn(p, sep);
+		++n;
+	}
+	a = calloc(n+1, sizeof(char *));
+	if(!a) {
+		fprintf(stderr, "str2array(): Unable to alloc %d pointers\n",
+			n+1);
+		exit(1);
+	}
+	/* second pass: copy them */
+	p = s;
+	n = 0;
+	while(*p) {
+		l = strcspn(p, sep);
+		a[n] = malloc(l+1);
+		if(!a[n]) {
+			fprintf(stderr,
+				"str2array(): Unable to alloc %d bytes\n",
+				l+1);
+			exit(1);
+		}
+		memcpy(a[n], p, l);
+		a[n][l] = 0;
+		++n;
+		p += l;
+		p += strspn(p, sep);
+	}
+	return a;
+}
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/cmd.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/cmd.h
@ -0,0 +1,51 @@
+
+// $Id: cmd.h 1307 2007-03-14 22:22:36Z hieuhoang1972 $
+
+#if !defined(CMD_H)
+
+#define	CMD_H
+
+/* Parameter type codes: the argument that follows each parameter name in a
+   DeclareParams() call. */
+#define	CMDDOUBLETYPE	1
+#define	CMDENUMTYPE	2
+#define	CMDINTTYPE	3
+#define	CMDSTRINGTYPE	4
+#define	CMDSUBRANGETYPE	5
+#define	CMDGTETYPE	6
+#define	CMDLTETYPE	7
+#define	CMDSTRARRAYTYPE	8
+#define	CMDBOOLTYPE	9
+
+/* One entry of an enumeration table; a table ends with a null Name. */
+typedef struct {
+	char	*Name;
+	int	Idx;
+} Enum_T;
+
+/* One declared parameter: its type code, its name, the text it was last
+   set from (ArgStr), a pointer to the variable holding its value (Val) and
+   type-specific extra data (p). */
+typedef struct {
+	int	Type;
+	char	*Name,
+		*ArgStr;
+	void	*Val,
+		*p;
+} Cmd_T;
+
+#ifdef  __cplusplus
+extern "C" {
+#endif
+
+#if defined(__STDC__)
+int DeclareParams(char *, ...);
+#else
+int DeclareParams();
+#endif
+
+/* NOTE(review): SPrintParams and PrintParams are declared without a
+   parameter list; to a C++ compiler that means "no parameters" -- confirm
+   whether C++ callers need full prototypes here. */
+int	GetParams(int *n, char ***a,char *CmdFileName),
+	SPrintParams(),
+	PrintParams();
+
+#ifdef  __cplusplus
+}
+#endif
+#endif
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/collCounts.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/collCounts.cpp
@ -0,0 +1,315 @@
+/*
+
+ Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+ This file is part of GIZA++ ( extension of GIZA ).
+
+ This program is free software; you can redistribute it and/or
+ modify it under the terms of the GNU General Public License
+ as published by the Free Software Foundation; either version 2
+ of the License, or (at your option) any later version.
+
+ This program is distributed in the hope that it will be useful, 
+ but WITHOUT ANY WARRANTY; without even the implied warranty of
+ MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+ GNU General Public License for more details.
+
+ You should have received a copy of the GNU General Public License
+ along with this program; if not, write to the Free Software
+ Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+ USA.
+
+ */
+#include "alignment.h"
+#include "transpair_model3.h"
+#include <map>
+#include "collCounts.h"
+#include "MoveSwapMatrix.h"
+#include "D5Tables.h"
+#include "transpair_model5.h"
+#include "transpair_modelhmm.h"
+#include "Parameter.h"
+
+extern float COUNTINCREASE_CUTOFF_AL;
+// unifies collectCountsOverAlignments and findAlignmentNeighborhood FJO-20/07/99
+// Accumulates weighted counts over the neighborhood of the alignment held in
+// msc: the alignment itself (unless its center is flagged as deleted), every
+// non-deleted move of a position j to another i, and every non-deleted swap
+// of two positions aligned to different i.  A neighbor is weighted with
+// ascore*cmove(i,j) or ascore*cswap(j1,j2); neighbors with a negative factor
+// are skipped.  The weights are added into dtcount, ncount, p1count, p0count
+// and total_count.  Returns the number of alignments that contributed.
+template<class TRANSPAIR> int collectCountsOverNeighborhood(
+		const MoveSwapMatrix<TRANSPAIR>&msc, LogProb ascore,
+		Array2<LogProb,Vector<LogProb> >&dtcount,
+		Array2<LogProb,Vector<LogProb> >&ncount, LogProb&p1count,
+		LogProb&p0count, LogProb&total_count) {
+	int nAl=0;
+	const PositionIndex l=msc.get_l(), m=msc.get_m();
+	Array2<LogProb,Vector<LogProb> > cmove(l+1, m+1), cswap(l+1, m+1);
+	Vector<LogProb> negmove(m+1),negswap(m+1),plus1fert(l+1),minus1fert(l+1);
+	LogProb total_move, total_swap;
+	if (msc.isCenterDeleted()==0) {
+		total_move+=ascore;
+		nAl++;
+	}
+	// moves: position j is re-aligned from msc(j) to i
+	for (PositionIndex j=1; j<=m; j++) {
+		for (PositionIndex i=0; i<=l; i++) {
+			if (msc(j)!=i && !msc.isDelMove(i, j) ) {
+				double cm = msc.cmove(i, j);
+				if(cm<0)
+					continue;
+				LogProb newscore=ascore*cm;
+				total_move+=newscore;
+				nAl++;
+				cmove(i, j)+=newscore;
+				negmove[j]+=newscore;
+				plus1fert[i]+=newscore;
+				minus1fert[msc(j)]+=newscore;
+			}
+		}
+	}
+	// swaps: positions j1<j2 exchange the positions they are aligned to
+	for (PositionIndex j1=1; j1<=m; j1++) {
+		for (PositionIndex j2=j1+1; j2<=m; j2++) {
+			if (msc(j1)!=msc(j2) && !msc.isDelSwap(j1, j2) ) {
+				double cs = msc.cswap(j1, j2);
+				if(cs < 0){
+					continue;
+				}
+				LogProb newscore=ascore*cs;
+				total_swap+=newscore;
+				nAl++;
+				cswap(msc(j1), j2)+=newscore;
+				cswap(msc(j2), j1)+=newscore;
+				negswap[j1]+=newscore;
+				negswap[j2]+=newscore;
+			}
+		}
+	}
+	// NOTE(review): from here on the in/out parameter total_count is used,
+	// not the local sum; the two are equal only when the caller passes
+	// total_count in as zero (the caller in this file does).
+	total_count+=total_move+total_swap;
+	for (PositionIndex j=1; j<=m; j++)
+		for (PositionIndex i=0; i<=l; i++)
+			dtcount(i, j) += ((i==msc(j)) ? (total_count
+					-(negmove[j]+negswap[j])) : (cswap(i, j)+cmove(i, j)));
+	// fertility counts: unchanged, decreased by one, increased by one
+	for (PositionIndex i=1; i<=l; i++) {
+		LogProb temp=minus1fert[i]+plus1fert[i];
+		if (msc.fert(i)<MAX_FERTILITY)
+			ncount(i, msc.fert(i))+=total_count-temp;
+		if (msc.fert(i)>0&&msc.fert(i)-1<MAX_FERTILITY)
+			ncount(i, msc.fert(i)-1)+=minus1fert[i];
+		else if (minus1fert[i]!=0.0)
+			cerr << "ERROR: M1Fa: " << minus1fert[i] << ' ' << i << ' '
+					<< msc.fert(i)<< endl;
+		if (msc.fert(i)+1<MAX_FERTILITY)
+			ncount(i, msc.fert(i)+1)+=plus1fert[i];
+	}
+	// the same three cases for position 0, feeding p1count and p0count
+	LogProb temp=minus1fert[0]+plus1fert[0];
+	p1count += (total_count-temp)*(LogProb)msc.fert(0);
+	p0count += (total_count-temp)*(LogProb)(m-2*msc.fert(0));
+	if (msc.fert(0)>0) {
+		p1count += (minus1fert[0])*(LogProb)(msc.fert(0)-1);
+		p0count += (minus1fert[0])*(LogProb)(m-2*(msc.fert(0)-1));
+	} else if (minus1fert[0]!=0.0)
+		cerr << "ERROR: M1Fb: " << minus1fert[0] << endl;
+	if (int(m)-2*(int(msc.fert(0))+1)>=0) {
+		p1count += (plus1fert[0])*(LogProb)(msc.fert(0)+1);
+		p0count += (plus1fert[0])*(LogProb)(m-2*(msc.fert(0)+1));
+	}
+	msc.check();
+	return nAl;
+}
+;
+
+// Overload taking an untyped (void*) model pointer: collects nothing and
+// returns 0.0.
+template<class TRANSPAIR> double collectCountsOverNeighborhoodForSophisticatedModels(
+		const MoveSwapMatrix<TRANSPAIR>&, LogProb, void*) {
+	return 0.0;
+}
+
+// Adds normalized_ascore to the d4 table for every position j of alignment
+// msc that is not aligned to 0: through augCountRef_first when j is the head
+// of the position it is aligned to, through augCountRef_bigger otherwise.
+template<class TRANSPAIR> void _collectCountsOverNeighborhoodForSophisticatedModels(
+		const MoveSwapMatrix<TRANSPAIR>&Mmsc, const alignment&msc,
+		const TRANSPAIR&ef, LogProb normalized_ascore, d4model*d4Table) {
+	Mmsc.check();
+	const PositionIndex m=msc.get_m(), l=msc.get_l();
+	for (PositionIndex j=1; j<=m; ++j) {
+		if (msc(j)==0)
+			continue;
+		if (msc.get_head(msc(j))!=j) {
+			// j follows another position that is aligned to the same place
+			d4Table->augCountRef_bigger(j, msc.prev_in_cept(j), 0,
+					d4Table->fwordclasses->getClass(ef.get_fs(j)), l, m,normalized_ascore);
+			continue;
+		}
+		// j is the head: the count depends on the center of the previous
+		// position with non-zero fertility
+		int ep=msc.prev_cept(msc(j));
+		d4Table->augCountRef_first(j, msc.get_center(ep),
+				d4Table->ewordclasses->getClass(ef.get_es(ep)),
+				d4Table->fwordclasses->getClass(ef.get_fs(j)), l, m,normalized_ascore);
+	}
+}
+
+// d5 variant: first collects the d4 counts through the d4model overload on
+// d5Table->d4m, then walks the positions aligned to each i=1..l in list order
+// (als_i / als_j[].next) and adds normalized_ascore to the d5 count tables.
+// vac marks the positions already visited and vac_all counts the ones not
+// yet visited.
+template<class TRANSPAIR> void _collectCountsOverNeighborhoodForSophisticatedModels(
+		const MoveSwapMatrix<TRANSPAIR>&Mmsc, const alignment&msc,
+		const TRANSPAIR&ef, LogProb normalized_ascore, d5model*d5Table) {
+	Mmsc.check();
+	_collectCountsOverNeighborhoodForSophisticatedModels(Mmsc, msc, ef,
+			normalized_ascore, &d5Table->d4m);
+	Mmsc.check();
+	const PositionIndex m=msc.get_m(), l=msc.get_l();
+	PositionIndex prev_cept=0;
+	PositionIndex vac_all=m;
+	Vector<char> vac(m+1,0);
+	for (PositionIndex i=1; i<=l; i++) {
+		PositionIndex cur_j=msc.als_i[i];
+		PositionIndex prev_j=0;
+		PositionIndex k=0;	// positions of this cept handled so far
+		if (cur_j) { // process first word of cept
+			k++;
+			d5Table->getCountRef_first(vacancies(vac, cur_j), vacancies(vac,
+					msc.get_center(prev_cept)),
+					d5Table->fwordclasses->getClass(ef.get_fs(cur_j)), l, m,
+					vac_all-msc.fert(i)+k) +=normalized_ascore;
+			vac_all--;
+			assert(vac[cur_j]==0);
+			vac[cur_j]=1;
+			Mmsc.check();
+			prev_j=cur_j;
+			cur_j=msc.als_j[cur_j].next;
+		}
+		while (cur_j) { // process following words of cept
+			k++;
+			int vprev=vacancies(vac, prev_j);
+			d5Table->getCountRef_bigger(vacancies(vac, cur_j), vprev,
+					d5Table->fwordclasses->getClass(ef.get_fs(cur_j)), l, m,
+					vac_all-vprev/*orig. German note "war weg": was gone*/-msc.fert(i)+k)+=normalized_ascore;
+			vac_all--;
+			vac[cur_j]=1;
+			Mmsc.check();
+			prev_j=cur_j;
+			cur_j=msc.als_j[cur_j].next;
+		}
+		assert(k==msc.fert(i));
+		if (k)
+			prev_cept=i;
+	}
+	// whatever was never visited must be what is aligned to position 0
+	assert(vac_all==msc.fert(0));
+}
+
+extern int NumberOfAlignmentsInSophisticatedCountCollection;
+// Collects the model-specific counts (d5Table may be any MODEL accepted by
+// the _collectCounts... overloads) for the alignment in msc and for each of
+// its non-deleted move and swap neighbors.  A neighbor is weighted with
+// cmove/cswap times normalized_ascore and only counted when that weight
+// exceeds COUNTINCREASE_CUTOFF_AL; neighbors with a negative factor are
+// skipped.  The working copy x is modified for each neighbor and restored
+// afterwards.  Returns the sum of all weights that were counted.
+template<class TRANSPAIR, class MODEL> double collectCountsOverNeighborhoodForSophisticatedModels(
+		const MoveSwapMatrix<TRANSPAIR>&msc, LogProb normalized_ascore,
+		MODEL*d5Table) {
+	const PositionIndex m=msc.get_m(), l=msc.get_l();
+	alignment x(msc);
+	double sum=0;
+	msc.check();
+	if ( !msc.isCenterDeleted() ) {
+		_collectCountsOverNeighborhoodForSophisticatedModels<TRANSPAIR>(msc, x,
+				msc.get_ef(), normalized_ascore, d5Table);
+		NumberOfAlignmentsInSophisticatedCountCollection++;
+		sum+=normalized_ascore;
+	}
+	msc.check();
+	// move neighbors
+	for (WordIndex j=1; j<=m; j++)
+		for (WordIndex i=0; i<=l; i++) {
+			WordIndex old=x(j);
+			if (i!=old&& !msc.isDelMove(i, j) ) {
+				msc.check();
+				double cm =msc.cmove(i, j);
+				if(cm < 0){
+					continue;
+				}
+				double c=cm*normalized_ascore;
+				if (c > COUNTINCREASE_CUTOFF_AL) {
+					x.set(j, i);
+					_collectCountsOverNeighborhoodForSophisticatedModels<
+							TRANSPAIR>(msc, x, msc.get_ef(), c, d5Table);
+					NumberOfAlignmentsInSophisticatedCountCollection++;
+					x.set(j, old);
+					sum+=c;
+				}
+				msc.check();
+			}
+		}
+	// swap neighbors
+	for (PositionIndex j1=1; j1<=m; j1++) {
+		for (PositionIndex j2=j1+1; j2<=m; j2++) {
+			if (msc(j1)!=msc(j2) && !msc.isDelSwap(j1, j2) ) {
+				double cs = msc.cswap(j1, j2);
+				if(cs < 0)
+					continue;
+				double c=cs*normalized_ascore;
+				msc.check();
+				if (c > COUNTINCREASE_CUTOFF_AL) {
+					int old1=msc(j1), old2=msc(j2);
+					x.set(j1, old2);
+					x.set(j2, old1);
+					_collectCountsOverNeighborhoodForSophisticatedModels<
+							TRANSPAIR>(msc, x, msc.get_ef(), c, d5Table);
+					NumberOfAlignmentsInSophisticatedCountCollection++;
+					x.set(j1, old1);
+					x.set(j2, old2);
+					sum+=c;
+				}
+				msc.check();
+			}
+		}
+	}
+	msc.check();
+	return sum;
+}
+
+// Collects counts over the neighborhoods of all alignments in smsc (pairs of
+// move/swap matrix and score) for the sentence pair es/fs.  The per-alignment
+// counts are summed; _total receives the sum of their totals.  That sum,
+// divided by count unless count is 0, is the normalizer all_total.  With
+// addCounts set, the normalized counts are added to tTable, aCountTable,
+// dCountTable, nCountTable, p0count and p1count, and, when d4Table is
+// non-null, the model-specific counts are collected as well.  Returns the
+// number of alignments visited, or 0 when the normalizer is infinite.
+// NOTE(review): the declaration in collCounts.h takes p1count/p0count as
+// double& while this definition takes SyncDouble& -- confirm they denote
+// the same function.
+template<class TRANSPAIR, class MODEL> int collectCountsOverNeighborhood(
+		const Vector<pair<MoveSwapMatrix<TRANSPAIR>*,LogProb> >&smsc,
+		Vector<WordIndex>&es, Vector<WordIndex>&fs, tmodel<COUNT,PROB>&tTable,
+		amodel<COUNT>&aCountTable, amodel<COUNT>&dCountTable,
+		nmodel<COUNT>&nCountTable, SyncDouble&p1count, SyncDouble&p0count,
+		LogProb&_total, float count, bool addCounts, MODEL*d4Table) {
+	int nAl=0;
+	const PositionIndex l=es.size()-1, m=fs.size()-1;
+	Array2<LogProb,Vector<LogProb> > dtcount(l+1, m+1), ncount(l+1,
+			MAX_FERTILITY+1);
+	LogProb p0=0, p1=0, all_total=0;
+	for (unsigned int i=0; i<smsc.size(); ++i) {
+		LogProb this_total=0;
+		nAl+=collectCountsOverNeighborhood(*smsc[i].first, smsc[i].second,
+				dtcount, ncount, p1, p0, this_total);
+		all_total+=this_total;
+	}
+	_total=all_total;
+	if(count==0){
+		cerr << "WARNING: COUNT ==0" << endl;
+	}else
+		all_total/=(double)count;
+	if(isinf(all_total)){
+		cerr << "ALL_TOTAL is INF\n" ;
+		return 0;
+	}
+	double sum2=0;
+	if (addCounts && d4Table) {
+		for (unsigned int i=0; i<smsc.size(); ++i) {
+			//for(WordIndex j=1;j<=m;j++)for(WordIndex ii=0;ii<=l;ii++)
+			//  (*smsc[i].first).cmove(ii,j);
+			sum2+=collectCountsOverNeighborhoodForSophisticatedModels(
+					*smsc[i].first, smsc[i].second/all_total, d4Table);
+		}
+		// the collected weights are expected to add up to count
+		if (!(fabs(count-sum2)<0.05))
+			cerr << "WARNING: DIFFERENT SUMS: (" << count << ") (" << sum2 << ") (" << all_total
+					<< ")\n";
+	}
+
+	/**
+	 NOTE: the count tables are updated below.
+	 */
+	if(fabs(all_total)==0){
+		// Error
+		cerr << "Hill climbing yields zero count " << endl;
+	}else{
+	if (addCounts) {
+		for (PositionIndex i=0; i<=l; i++) {
+			for (PositionIndex j=1; j<=m; j++) {
+				LogProb ijadd=dtcount(i, j)/all_total;
+				if (ijadd>COUNTINCREASE_CUTOFF_AL) {
+					tTable.incCount(es[i], fs[j], ijadd);
+					dCountTable.addValue(j, i, l, m, ijadd);
+					aCountTable.addValue(i, j, l, m, ijadd);
+				}
+			}
+			if (i>0)
+				for (PositionIndex n=0; n<MAX_FERTILITY; n++)
+					nCountTable.addValue(es[i], n, ncount(i, n)/all_total);
+		}
+		p0count+=p0/all_total;
+		p1count+=p1/all_total;
+	}}
+	return nAl;
+}
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/collCounts.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/collCounts.h
@ -0,0 +1,80 @@
+/*
+
+Copyright (C) 1999,2000,2001  Franz Josef Och (RWTH Aachen - Lehrstuhl fuer Informatik VI)
+
+This file is part of GIZA++ ( extension of GIZA ).
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef collCounts_h_defined
+#define collCounts_h_defined
+#include "alignment.h"
+#include "transpair_model3.h"
+#include <map>
+#include "MoveSwapMatrix.h"
+#include "D4Tables.h"
+#include "transpair_model4.h"
+
+// A single move or swap operation: a type code and its two operands.
+class OneMoveSwap
+{
+ public:
+  short type;
+  short a,b;
+  OneMoveSwap(short _type,short _a,short _b)
+    : type(_type),a(_a),b(_b)
+    {}
+  // The comparison operators read a and b, so the default constructor must
+  // not leave them indeterminate.
+  OneMoveSwap()
+    : type(0),a(0),b(0){}
+};
+
+// Lexicographic order on (type, a, b).
+inline bool operator<(const OneMoveSwap&a,const OneMoveSwap&b)
+{
+  if(a.type!=b.type)
+    return a.type<b.type;
+  if(a.a!=b.a)
+    return a.a<b.a;
+  return a.b<b.b;
+}
+
+// Equal when type and both operands agree.
+inline bool operator==(const OneMoveSwap&a,const OneMoveSwap&b)
+{
+  if(a.type!=b.type)
+    return false;
+  if(a.a!=b.a)
+    return false;
+  return a.b==b.b;
+}
+
+// Writes the operation as "(type,a,b)".
+inline ostream&operator<<(ostream&out,const OneMoveSwap&o)
+{
+  out << '(' << o.type;
+  out << "," << o.a;
+  out << "," << o.b << ")";
+  return out;
+}
+
+// Writes every element of s to out, each followed by a blank.
+inline ostream &operator<<(ostream &out,const set<OneMoveSwap>&s)
+{
+  for(set<OneMoveSwap>::const_iterator i=s.begin();i!=s.end();++i)
+    out << *i << ' ';	// write to the stream passed in, not to cout
+  return out;
+}
+
+bool makeOneMoveSwap(const alignment&a,const alignment&b,set<OneMoveSwap>&oms);
+
+// Count collection over the neighborhoods of a set of alignments; defined in
+// collCounts.cpp.
+// NOTE(review): the definition there takes p1count/p0count as SyncDouble&
+// and has no default for d4Table -- confirm that the two signatures agree.
+template<class TRANSPAIR,class MODEL>
+int collectCountsOverNeighborhood(const Vector<pair<MoveSwapMatrix<TRANSPAIR>*,LogProb> >&smsc,
+				   Vector<WordIndex>&es,
+				   Vector<WordIndex>&fs,tmodel<COUNT,PROB>&tTable,
+				   amodel<COUNT>&aCountTable,amodel<COUNT>&dCountTable,
+				   nmodel<COUNT>&nCountTable,double&p1count,double&p0count,
+				   LogProb&_total,float count,bool addCounts,MODEL*d4Table=0);
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/common.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/common.h
@ -0,0 +1,3 @@
+/*!
+Global definitions shared by all main files of the program set.
+*/
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/d4norm.cxx
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/d4norm.cxx
@ -0,0 +1,126 @@
+// D4 Normalization executable
+
+#include <iostream>
+#include <strstream>
+#include <string>
+#include "hmm.h"
+#include "D4Tables.h"
+#include "Parameter.h"
+#define ITER_M2 0
+#define ITER_MH 5
+GLOBAL_PARAMETER3(int,Model1_Iterations,"Model1_Iterations","NO. ITERATIONS MODEL 1","m1","number of iterations for Model 1",PARLEV_ITER,5);
+GLOBAL_PARAMETER3(int,Model2_Iterations,"Model2_Iterations","NO. ITERATIONS MODEL 2","m2","number of iterations for Model 2",PARLEV_ITER,ITER_M2);
+GLOBAL_PARAMETER3(int,HMM_Iterations,"HMM_Iterations","mh","number of iterations for HMM alignment model","mh", PARLEV_ITER,ITER_MH);
+GLOBAL_PARAMETER3(int,Model3_Iterations,"Model3_Iterations","NO. ITERATIONS MODEL 3","m3","number of iterations for Model 3",PARLEV_ITER,5);
+GLOBAL_PARAMETER3(int,Model4_Iterations,"Model4_Iterations","NO. ITERATIONS MODEL 4","m4","number of iterations for Model 4",PARLEV_ITER,5);
+GLOBAL_PARAMETER3(int,Model5_Iterations,"Model5_Iterations","NO. ITERATIONS MODEL 5","m5","number of iterations for Model 5",PARLEV_ITER,0);
+GLOBAL_PARAMETER3(int,Model6_Iterations,"Model6_Iterations","NO. ITERATIONS MODEL 6","m6","number of iterations for Model 6",PARLEV_ITER,0);
+
+GLOBAL_PARAMETER(float, PROB_SMOOTH,"probSmooth","probability smoothing (floor) value ",PARLEV_OPTHEUR,1e-7);
+GLOBAL_PARAMETER(float, MINCOUNTINCREASE,"minCountIncrease","minimal count increase",PARLEV_OPTHEUR,1e-7);
+
+GLOBAL_PARAMETER2(int,Transfer_Dump_Freq,"TRANSFER DUMP FREQUENCY","t2to3","output: dump of transfer from Model 2 to 3",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER2(bool,Verbose,"verbose","v","0: not verbose; 1: verbose",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER(bool,Log,"log","0: no logfile; 1: logfile",PARLEV_OUTPUT,0);
+
+GLOBAL_PARAMETER(double,P0,"p0","fixed value for parameter p_0 in IBM-3/4 (if negative then it is determined in training)",PARLEV_EM,-1.0);
+GLOBAL_PARAMETER(double,M5P0,"m5p0","fixed value for parameter p_0 in IBM-5 (if negative then it is determined in training)",PARLEV_EM,-1.0);
+GLOBAL_PARAMETER3(bool,Peg,"pegging","p","DO PEGGING? (Y/N)","0: no pegging; 1: do pegging",PARLEV_EM,0);
+
+GLOBAL_PARAMETER(short,OldADBACKOFF,"adbackoff","",-1,0);
+GLOBAL_PARAMETER2(unsigned int,MAX_SENTENCE_LENGTH,"ml","MAX SENTENCE LENGTH","maximum sentence length",0,MAX_SENTENCE_LENGTH_ALLOWED);
+
+GLOBAL_PARAMETER(short, DeficientDistortionForEmptyWord,"DeficientDistortionForEmptyWord","0: IBM-3/IBM-4 as described in (Brown et al. 1993); 1: distortion model of empty word is deficient; 2: distoriton model of empty word is deficient (differently); setting this parameter also helps to avoid that during IBM-3 and IBM-4 training too many words are aligned with the empty word",PARLEV_MODELS,0);
+
+/**
+Here are parameters to support Load models and dump models
+*/
+
+GLOBAL_PARAMETER(int,restart,"restart","Restart training from a level,0: Normal restart, from model 1, 1: Model 1, 2: Model 2 Init (Using Model 1 model input and train model 2), 3: Model 2, (using model 2 input and train model 2), 4 : HMM Init (Using Model 1 model and train HMM), 5: HMM (Using Model 2 model and train HMM) 6 : HMM (Using HMM Model and train HMM), 7: Model 3 Init (Use HMM model and train model 3) 8: Model 3 Init (Use Model 2 model and train model 3) 9: Model 3, 10: Model 4 Init (Use Model 3 model and train Model 4) 11: Model 4 and on, ",PARLEV_INPUT,0);
+GLOBAL_PARAMETER(bool,dumpCount,"dumpcount","Whether we are going to dump count (in addition to) final output?",PARLEV_OUTPUT,false);
+GLOBAL_PARAMETER(bool,dumpCountUsingWordString,"dumpcountusingwordstring","In count table, should actual word appears or just the id? default is id",PARLEV_OUTPUT,false);
+/// END
+short OutputInAachenFormat=0;
+bool Transfer=TRANSFER;
+bool Transfer2to3=0;
+short NoEmptyWord=0;
+bool FEWDUMPS=0;
+GLOBAL_PARAMETER(bool,ONLYALDUMPS,"ONLYALDUMPS","1: do not write any files",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER(short,NCPUS,"NCPUS","Number of CPUS",PARLEV_EM,2);
+GLOBAL_PARAMETER(short,CompactAlignmentFormat,"CompactAlignmentFormat","0: detailled alignment format, 1: compact alignment format ",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER2(bool,NODUMPS,"NODUMPS","NO FILE DUMPS? (Y/N)","1: do not write any files",PARLEV_OUTPUT,0);
+
+GLOBAL_PARAMETER(WordIndex, MAX_FERTILITY, "MAX_FERTILITY",
+		"maximal fertility for fertility models", PARLEV_EM, 10);
+
+using namespace std;
+string Prefix, LogFilename, OPath, Usage, SourceVocabFilename,
+		TargetVocabFilename, CorpusFilename, TestCorpusFilename, t_Filename,
+		a_Filename, p0_Filename, d_Filename, n_Filename, dictionary_Filename;
+
+
+// d4 normalization tool: loads the two vocabularies and their ".classes"
+// files, adds up the d4 count tables named on the command line, normalizes
+// the result and writes it to outputFile and outputFile.b.
+int main(int argc, char* argv[]){
+	if(argc < 5){
+		cerr << "Usage: " << argv[0] << "  vcb1 vcb2 outputFile baseFile [additional1 ]..." << endl;
+		return 1;
+	}
+	WordClasses ewc,fwc;
+	d4model d4m(MAX_SENTENCE_LENGTH,ewc,fwc);
+	Vector<WordEntry> evlist,fvlist;
+	vcbList eTrainVcbList(evlist), fTrainVcbList(fvlist);
+
+	// vocabularies
+	TargetVocabFilename = argv[2];
+	SourceVocabFilename = argv[1];
+	eTrainVcbList.setName(argv[1]);
+	fTrainVcbList.setName(argv[2]);
+	eTrainVcbList.readVocabList();
+	fTrainVcbList.readVocabList();
+
+	// word classes live next to the vocabularies
+	const string eClassFile = string(argv[1]) + ".classes";
+	const string fClassFile = string(argv[2]) + ".classes";
+	d4m.makeWordClasses(eTrainVcbList, fTrainVcbList, eClassFile.c_str(), fClassFile.c_str(),eTrainVcbList,fTrainVcbList);
+
+	// accumulate every count table given on the command line
+	for(int arg = 4; arg < argc; ++arg){
+		const string tableA = argv[arg];
+		const string tableB = tableA + ".b";
+		const bool loaded = d4m.augCount(tableA.c_str(),tableB.c_str());
+		if(!loaded){
+			cerr << "ERROR Loading (d) table " << tableA << "  " << tableB << endl;
+			continue;
+		}
+		cerr << "Loading (d4) table " << tableA << "/" << tableB  << " OK" << endl;
+	}
+
+	d4m.normalizeTable();
+	const string outA = argv[3];
+	const string outB = outA + ".b";
+	cerr << "Outputing d4 table to " << outA << " " << outB;
+	d4m.printProbTable(outA.c_str(),outB.c_str());
+	return 0;
+}
+
+// Some utility functions to get it compile..
+
+ofstream logmsg;
+// Returns the decimal representation of n.  (Despite the name the
+// conversion goes from number to string.)  Negative values get a leading
+// '-'; non-negative values are rendered exactly as before.
+const string str2Num(int n) {
+	// Work on the magnitude as unsigned so that negative numbers do not
+	// yield garbage digits and the most negative int does not overflow.
+	const bool negative = n < 0;
+	unsigned int magnitude = negative ? 0u - (unsigned int)n : (unsigned int)n;
+	string number = "";
+	do {
+		number.insert((size_t)0, 1, (char)(magnitude % 10 + '0'));
+	} while ((magnitude /= 10) > 0);
+	if (negative)
+		number.insert((size_t)0, 1, '-');
+	return (number);
+}
+double LAMBDA=1.09;
+
+Vector<map< pair<int,int>,char > > ReferenceAlignment;
+
+// Stub that only exists so that this tool links: all arguments are ignored.
+// A function declared to return double must return a value, otherwise a call
+// has undefined behavior, so report zero errors.
+double ErrorsInAlignment(const map< pair<int,int>,char >&reference,
+		const Vector<WordIndex>&test, int l, int&missing, int&toomuch,
+		int&eventsMissing, int&eventsToomuch, int pair_no){
+	return 0.0;
+}
+
+// Stub that only exists so that this tool links: prints nothing.
+void printGIZAPars(ostream&out){
+}
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/defs.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/defs.h
@ -0,0 +1,78 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef _defs_h
+#define _defs_h 1
+#include <string>
+#include <cmath>
+#include <climits>
+
+// Integer codes named TRANSFER_SIMPLE / TRANSFER.
+// NOTE(review): presumably select how a model transfer is done; their users are not visible in this header.
+const int TRANSFER_SIMPLE=1;
+const int TRANSFER=0;
+
+const unsigned int MAX_SENTENCE_LENGTH_ALLOWED=101;
+// Upper bound on the number of sentence pairs that sentenceHandler reads
+// into its in-memory buffer per refill (see getSentence.cpp).
+const int TRAIN_BUFFER_SIZE= 50000;
+// The 4-byte variant of the index types is always used; the 2-byte
+// alternative is kept below, commented out.
+//#ifdef WORDINDEX_WITH_4_BYTE
+typedef unsigned int WordIndex;
+const unsigned int MAX_VOCAB_SIZE=UINT_MAX;
+typedef unsigned int PositionIndex;
+//#else
+//typedef unsigned short WordIndex;
+//const unsigned int MAX_VOCAB_SIZE=USHRT_MAX;
+//typedef unsigned short PositionIndex;
+//#endif
+// Defined in another translation unit.
+extern WordIndex MAX_FERTILITY;
+
+const int MAX_W=457979;
+extern double LAMBDA; // Lambda that is used to scale cross_entropy factor
+
+// Probabilities and counts are both stored as single-precision floats.
+typedef float PROB ;
+typedef float COUNT ;
+ 
+// Thin wrapper around a double. Despite the name, the operators defined here
+// apply ordinary arithmetic to the stored value; no logarithm is taken
+// inside this class.
+class LogProb {
+ private:
+  double value ;
+ public:
+  // Construction from the numeric types below is implicit.
+  LogProb() : value(0) {}
+  LogProb(double init) : value(init) {}
+  LogProb(float init) : value(init) {}
+  LogProb(int init) : value(init) {}
+  LogProb(WordIndex init) : value(init) {}
+
+  // Implicit conversion back to the stored double.
+  operator double() const {
+    return value;
+  }
+
+  // Compound assignments update the stored value and return a copy of the
+  // updated object (by value, not by reference).
+  LogProb operator *= (double factor) {
+    value *= factor;
+    return *this;
+  }
+  LogProb operator *= (LogProb factor) {
+    value *= factor.value;
+    return *this;
+  }
+  LogProb operator /= (double divisor) {
+    value /= divisor;
+    return *this;
+  }
+  LogProb operator /= (LogProb divisor) {
+    value /= divisor.value;
+    return *this;
+  }
+  LogProb operator += (double addend) {
+    value += addend;
+    return *this;
+  }
+  LogProb operator += (LogProb addend) {
+    value += addend.value;
+    return *this;
+  }
+};
+
+// Integer level codes. In the sources of this package they are passed as the
+// level argument of the GLOBAL_PARAMETER* macros (e.g. PARLEV_EM in
+// getSentence.cpp, PARLEV_ITER in hmmnorm.cxx).
+// NOTE(review): the grouping each code stands for is inferred from its name only.
+const int PARLEV_ITER=1;
+const int PARLEV_OPTHEUR=2;
+const int PARLEV_OUTPUT=3;
+const int PARLEV_SMOOTH=4;
+const int PARLEV_EM=5;
+const int PARLEV_MODELS=6;
+const int PARLEV_SPECIAL=7;
+const int PARLEV_INPUT=8;
+
+#endif
+  
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/file_spec.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/file_spec.h
@ -0,0 +1,59 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef FILE_SPEC_H
+#define FILE_SPEC_H
+
+#include <ctime>
+#include <cstdlib>
+#include <cstring>
+#include <cstdio>
+
+/* Get_File_Spec builds a string, locally called file_spec, that is the
+   concatenation of the date and time of execution and the name of the
+   user performing the execution (read from the USER environment
+   variable; an empty name is used when USER is not set).
+
+   Returns a NUL-terminated buffer obtained from malloc(), which this
+   function does not free, or NULL when the allocation fails.
+   The time stamp has the form "YY-MM-DD.HHMMSS."; tm_year counts years
+   since 1900, so from the year 2000 on the first field is three digits
+   wide (e.g. 117 for 2017).
+
+   The function is declared inline because it is defined in a header. */
+/* Originally implemented in C by Yaser Al-Onaizan; 
+   editions for C++ and formatting by Noah A. Smith, 9 July 1999 */
+
+inline char *Get_File_Spec (){
+  char time_stmp[57];
+  const time_t t = time(NULL);
+  const struct tm *local = localtime(&t);
+
+  // Bounded formatting: never writes past time_stmp.
+  snprintf(time_stmp, sizeof(time_stmp), "%02d-%02d-%02d.%02d%02d%02d.",
+	   local->tm_year, (local->tm_mon + 1), local->tm_mday,
+	   local->tm_hour, local->tm_min, local->tm_sec);
+
+  // getenv returns NULL when USER is unset; do not hand that to strlen/strcat.
+  const char *user = getenv("USER");
+  if (user == NULL)
+    user = "";
+
+  char *file_spec = (char *)malloc(sizeof(char) *
+				   (strlen(time_stmp) + strlen(user) + 1));
+  if (file_spec == NULL)
+    return NULL;
+  strcpy(file_spec, time_stmp);
+  strcat(file_spec, user);
+  return file_spec;
+}
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/getSentence.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/getSentence.cpp
@ -0,0 +1,470 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* --------------------------------------------------------------------------*
+ *                                                                           *
+ * Module : getSentence                                                      *
+ *                                                                           *
+ * Method Definitions File: getSentence.cpp                                  *
+ *                                                                           *
+ * Objective: Defines classes and methods for handling I/O for the parallel  *
+ *            corpus.                                                        *
+ *****************************************************************************/
+
+
+#include "getSentence.h"
+#include <iostream>
+#include <strstream>
+#include <cstdio>
+#include <cstdlib>
+#include <boost/algorithm/string.hpp>
+#include <vector>
+#include <set>
+#include <pthread.h>
+#include "Parameter.h"
+#include "errno.h"
+
+// Counts how often a "truncated sentence" / unknown-source-word message was
+// due; the messages themselves are printed only while the count is below 100.
+int PrintedTooLong=0;
+
+/* -------------- Method Definitions for Class sentenceHandler --------------*/
+
+// Parameters used for pairs with a negative occurrence count:
+//  - ManlexMAX_MULTIPLICITY: exclusive upper bound of the lambda grid searched
+//    in optimize_lambda().
+//  - Manlexfactor1 / Manlexfactor2: when non-zero, used as the real count of
+//    pairs whose occurrence count is exactly -1.0 / -2.0.
+// NOTE(review): the exact expansion of GLOBAL_PARAMETER lives in Parameter.h and is not visible here.
+GLOBAL_PARAMETER(double,ManlexMAX_MULTIPLICITY,"manlexMAX_MULTIPLICITY","",PARLEV_EM,20.0);
+GLOBAL_PARAMETER(double,Manlexfactor1,"manlexfactor1","",PARLEV_EM,0.0);
+GLOBAL_PARAMETER(double,Manlexfactor2,"manlexfactor2","",PARLEV_EM,0.0);
+
+// Constructs a handler for the parallel corpus stored in `filename` and
+// resets the sentence pair sequential number (count) to zero.
+//
+//   filename  path of the corpus file; the process exits with status 1 when
+//             it cannot be opened.
+//   elist     source vocabulary list, may be null.
+//   flist     target vocabulary list, may be null.
+//
+// When both lists are given, the whole corpus is read once through
+// getNextSentence(), the pair totals are accumulated, and compact() is then
+// called on each list with the set of word ids that were seen (id 0 is
+// always part of that set).
+// When either list is missing, no pass is made and nothing is compacted.
+// Previously compact() was called unconditionally, which dereferenced a null
+// pointer for the default arguments declared in getSentence.h.
+//
+// If any pair has a negative occurrence count, realCount is allocated with
+// one entry (initialised to 1.0) per pair; otherwise it stays null.
+sentenceHandler::sentenceHandler(const char*  filename, vcbList* elist, 
+				 vcbList*  flist) : realCount(0)
+{
+    pthread_mutex_init(&readsent_mutex,NULL);
+    pthread_mutex_init(&setprob_mutex,NULL);
+
+    position = 0;
+    readflag = false ;
+    allInMemory = false ;
+    inputFilename = filename ;
+    inputFile = new ifstream(filename);
+    if(!(*inputFile)){
+        cerr << "\nERROR:(a) Cannot open " << filename;
+        exit(1);
+    }
+    currentSentence = 0;
+    totalPairs1 = 0 ;
+    totalPairs2 =0;
+    pair_no = 0 ;
+    noSentInBuffer = 0 ;
+    Buffer.clear();
+
+    const bool haveVocabularies = (elist && flist);
+    bool isNegative=false;
+    // Word ids observed in the corpus; id 0 is always included.
+    std::set<WordIndex> evoc,fvoc;
+    evoc.insert(0);
+    fvoc.insert(0);
+    if (haveVocabularies){
+        cout << "Calculating vocabulary frequencies from corpus " << filename << '\n';
+        sentPair s ;
+        while (getNextSentence(s, elist, flist))
+        {
+            for(unsigned int i = 0 ; i< s.eSent.size() ; i++){
+                evoc.insert(s.eSent[i]);
+            }
+            for(unsigned int i = 0 ; i< s.fSent.size() ; i++){
+                fvoc.insert(s.fSent[i]);
+            }
+            totalPairs1++;
+            totalPairs2+=s.realCount; 
+            // NOTE: this value might change during training 
+            // for words from the manual dictionary, yet this is ignored!
+
+            if( s.noOcc<0 )
+                isNegative=true;
+        }
+    }
+    if( isNegative )
+    {
+        cerr << "WARNING: corpus contains negative occurrency frequencies => these are interpreted as entries of a manual dictionary.\n";
+        realCount=new Vector<double>(totalPairs1,1.0);
+    }
+    else
+        realCount=0;
+
+    // Only touch the vocabulary lists when they were actually supplied.
+    if (haveVocabularies){
+        elist->compact(evoc);
+        flist->compact(fvoc);
+    }
+}
+
+// Constructs a handler for the parallel corpus stored in `filename` and
+// resets the sentence pair sequential number (count) to zero.
+// When both vocabulary lists are given, the corpus is read once through
+// getNextSentence(); every source word id seen is inserted into `eapp` and
+// every target word id into `fapp`, and the pair totals are accumulated.
+// If any pair has a negative occurrence count, realCount is allocated with
+// one entry (1.0) per pair; otherwise it stays null.
+// The process exits with status 1 when the file cannot be opened.
+sentenceHandler::sentenceHandler(const char*  filename, vcbList* elist,
+		vcbList*  flist,std::set<WordIndex>& eapp, std::set<WordIndex>& fapp) : realCount(0)
+{
+	pthread_mutex_init(&readsent_mutex,NULL);
+	pthread_mutex_init(&setprob_mutex,NULL);
+
+	// Open the corpus; without it nothing else is usable.
+	inputFilename = filename;
+	inputFile = new ifstream(filename);
+	if( !(*inputFile) ){
+		cerr << "\nERROR:(a) Cannot open " << filename;
+		exit(1);
+	}
+
+	// Reset the reading state.
+	position = 0;
+	currentSentence = 0;
+	pair_no = 0;
+	noSentInBuffer = 0;
+	totalPairs1 = 0;
+	totalPairs2 = 0;
+	readflag = false;
+	allInMemory = false;
+	Buffer.clear();
+
+	bool sawNegativeCount = false;
+	if( elist && flist ){
+		cout << "Calculating vocabulary frequencies from corpus " << filename << '\n';
+		sentPair current;
+		while( getNextSentence(current, elist, flist) ){
+			for(size_t e = 0; e < current.eSent.size(); ++e)
+				eapp.insert(current.eSent[e]);
+			for(size_t f = 0; f < current.fSent.size(); ++f)
+				fapp.insert(current.fSent[f]);
+
+			++totalPairs1;
+			// NOTE: this value might change during training
+			// for words from the manual dictionary, yet this is ignored!
+			totalPairs2 += current.realCount;
+
+			if( current.noOcc < 0 )
+				sawNegativeCount = true;
+		}
+	}
+
+	if( !sawNegativeCount ){
+		realCount = 0;
+		return;
+	}
+	cerr << "WARNING: corpus contains negative occurrency frequencies => these are interpreted as entries of a manual dictionary.\n";   
+	realCount = new Vector<double>(totalPairs1,1.0);
+}
+
+// Resets the handler so that the next getNextSentence() call starts again
+// at the first sentence pair.
+// The buffer is kept only when the whole corpus is in memory and the buffer
+// begins with sentence number 1; otherwise it is emptied. Unless the corpus
+// is in memory, the input file is closed and opened again.
+void sentenceHandler::rewind()
+{
+    position = 0;
+    currentSentence = 0;
+    readflag = false ;
+
+    // Does the buffer already hold the first chunk of pairs?
+    const bool bufferStartsAtFirstPair =
+        Buffer.size() >= 1 && Buffer[currentSentence].sentenceNo == 1;
+    const bool keepBuffer = allInMemory && bufferStartsAtFirstPair;
+    if (!keepBuffer){
+        if (Buffer.size() > 0)
+            cerr << ' ' <<  Buffer[currentSentence].sentenceNo << '\n';
+        pair_no = 0 ;
+        noSentInBuffer = 0 ;
+        Buffer.clear();
+    }
+
+    if (allInMemory)
+        return;
+
+    // Start over with a fresh stream on the same file. A failure to open is
+    // only reported; execution continues.
+    delete inputFile;
+    inputFile = new ifstream(inputFilename);
+    if(!(*inputFile)){
+        cerr << "\nERROR:(b) Cannot open " << inputFilename << " " << (int)errno;
+    }
+}
+
+  
+// Hands out the next sentence pair of the corpus in `sent`.
+//
+//   sent   receives a copy of the next buffered pair.
+//   elist  source vocabulary list, may be null.
+//   flist  target vocabulary list, may be null.
+//
+// When both lists are non-null, the frequency of every word id of each
+// pair freshly read from the file is increased by the pair's realCount, and
+// the process exits if an id is not below the list's uniqTokens().
+//
+// Returns the running position (number of pairs handed out since the last
+// rewind(), so the first pair yields 1), or 0 when no further pair is
+// available. The whole call runs with readsent_mutex held.
+int sentenceHandler::getNextSentence(sentPair& sent, vcbList* elist, vcbList* flist)
+{
+    pthread_mutex_lock(&readsent_mutex);
+    
+    // Single-pass do/while(false): `break` jumps to the common
+    // "unlock and return 0" exit at the bottom.
+    do{
+        sentPair s ;
+        if (readflag){
+            // The end of the corpus was reached by an earlier call.
+            // NOTE(review): the message says "rewinding", but the rewind() call is commented out.
+            cerr << "Attempting to read from the end of corpus, rewinding\n";
+            //rewind();
+            break;
+        } 
+        if (currentSentence >= noSentInBuffer){
+            // Buffer exhausted. If the whole corpus is in memory, there is nothing more to hand out.
+            if (allInMemory)
+                break;
+            /* no more sentences in buffer */
+            noSentInBuffer = 0 ;
+            currentSentence = 0 ;
+            Buffer.clear();
+            cout << "Reading more sentence pairs into memory ... \n";
+            // Refill with at most TRAIN_BUFFER_SIZE pairs from the file.
+            while((noSentInBuffer < TRAIN_BUFFER_SIZE) && readNextSentence(s)){
+                // Both sentences carry a leading id 0, hence the "-1" on the lengths.
+                if ((s.fSent.size()-1) > (MAX_FERTILITY-1) * (s.eSent.size()-1)){
+                    cerr << "WARNING: The following sentence pair has source/target sentence length ratio more than\n"<<
+                        "the maximum allowed limit for a source word fertility\n"<<
+                        " source length = " << s.eSent.size()-1 << " target length = " << s.fSent.size()-1 <<
+                        " ratio " << double(s.fSent.size()-1)/  (s.eSent.size()-1) << " ferility limit : " <<
+                        MAX_FERTILITY-1 << '\n';
+                    cerr << "Shortening sentence \n";
+                    cerr << s;
+                    // Cut both sentences down to the length of the shorter one.
+                    s.eSent.resize(min(s.eSent.size(),s.fSent.size()));
+                    s.fSent.resize(min(s.eSent.size(),s.fSent.size()));
+                }
+                Buffer.push_back(s) ;
+                //cerr << s.eAnchor.size() << " " << Buffer[Buffer.size()-1].eAnchor.size()<< endl;
+                if (elist && flist){
+                    // Source side: the loop starts at index 0, so the leading id 0 is counted too.
+                    if ((*elist).size() > 0)
+                        for (WordIndex i= 0 ; i < s.eSent.size() ; i++){
+                            if (s.eSent[i] >= (*elist).uniqTokens()){
+                                if( PrintedTooLong++<100)
+                                    cerr << "ERROR: source word " << s.eSent[i] << " is not in the vocabulary list \n";
+                                exit(-1);
+                            }
+                            (*elist).incFreq(s.eSent[i], s.realCount);
+                        }
+                    // Target side: the loop starts at index 1, skipping the leading id 0.
+                    if ((*flist).size() > 0)
+                        for (WordIndex j= 1 ; j < s.fSent.size() ; j++){
+                            if (s.fSent[j] >= (*flist).uniqTokens()){
+                                cerr << "ERROR: target word " << s.fSent[j] << " is not in the vocabulary list \n";
+                                exit(-1);
+                            }
+                            (*flist).incFreq(s.fSent[j], s.realCount);
+                        }
+                }
+                noSentInBuffer++;
+            }
+            // End of file reached while the buffer still starts at sentence 1:
+            // the complete corpus is held in the buffer.
+            if (inputFile->eof()){
+                allInMemory = (Buffer.size() >= 1 && 
+                               Buffer[currentSentence].sentenceNo == 1) ;
+                if (allInMemory)
+                    cout << "Corpus fits in memory, corpus has: " << Buffer.size() <<
+                    " sentence pairs.\n";
+            }
+        }
+        if(noSentInBuffer <= 0 ){
+            // Nothing could be read: remember that the end was reached.
+            //cerr << "# sent in buffer " << noSentInBuffer << '\n';
+            readflag = true ;
+            break;
+        }
+        sent = Buffer[currentSentence++] ;
+       // cerr << currentSentence-1 << " " << sent.eAnchor.size() << " " << Buffer[currentSentence-1].eAnchor.size()<< endl;
+        position ++;
+        // Pairs with a negative occurrence count take their real count from
+        // Manlexfactor1/2 (for -1.0 / -2.0 when the factor is non-zero) or
+        // from the per-sentence realCount table.
+        if( sent.noOcc<0 && realCount ){
+            if( Manlexfactor1 && sent.noOcc==-1.0 )
+                sent.realCount=Manlexfactor1;
+            else if( Manlexfactor2 && sent.noOcc==-2.0 )
+                sent.realCount=Manlexfactor2;
+            else
+                sent.realCount=(*realCount)[sent.getSentenceNo()-1];
+        }
+        pthread_mutex_unlock(&readsent_mutex);
+        return position ;
+    }while(false);
+    pthread_mutex_unlock(&readsent_mutex);
+    return 0;
+}
+// Reads the next pair of sentences from inputFile into `sent`.
+//
+// Two input layouts are accepted:
+//   * a line triple: the first line is the number of times the pair
+//     occurred in the corpus, the second line is the source sentence and
+//     the third line the target sentence; sentences are space-separated
+//     positive integer token ids;
+//   * a single line that is split at every '|', '#' or '*' character into
+//     three or more fields: count, source sentence, target sentence and,
+//     optionally, a fourth field of space-separated "e-f" position pairs.
+//     Pairs whose positions lie inside the two sentences are stored in
+//     sent.eAnchor / sent.fAnchor; the others are skipped.
+// A line that splits into exactly two fields is rejected.
+//
+// Id 0 is stored in front of both sentences, and each sentence is cut off
+// once it holds MAX_SENTENCE_LENGTH entries.
+//
+// Returns true when a pair was read (sent.sentenceNo is then the new value
+// of pair_no); returns false with `sent` emptied when the input ended or
+// was malformed.
+bool sentenceHandler::readNextSentence(sentPair& sent)
+{
+  string line;
+  bool fail(false) ;
+
+  sent.clear();
+  vector<string> splits;
+
+  // --- occurrence count -------------------------------------------------
+  if (getline(*inputFile, line)){
+    boost::algorithm::split(splits,line,boost::algorithm::is_any_of("|#*"));
+
+    if(splits.size()==2){
+      // Neither a plain count line nor a complete one-line record.
+      return false;
+    }
+    if(splits.size()>=3){
+      line = splits[0];
+    }
+
+    istrstream buffer(line.c_str());
+    buffer >> sent.noOcc;
+    if( sent.noOcc<0 )
+      {
+        if( realCount )
+          {
+            if( Manlexfactor1 && sent.noOcc==-1.0 )
+              sent.realCount=Manlexfactor1;
+            else if( Manlexfactor2 && sent.noOcc==-2.0 )
+              sent.realCount=Manlexfactor2;
+            else
+              sent.realCount=(*realCount)[pair_no];
+          }
+        else
+          sent.realCount=1.0;
+      }
+    else
+      sent.realCount=sent.noOcc;
+  }
+  else {
+    fail = true ;
+  }
+
+  // --- source sentence --------------------------------------------------
+  if (splits.size()>=3 || getline(*inputFile, line)){
+    if(splits.size()>=3){
+      line = splits[1];
+    }
+    istrstream buffer(line.c_str());
+    WordIndex w;  // w is a local variable for the token id
+    sent.eSent.push_back(0); // each source sentence is assumed to have
+    // a null word (id 0) at the beginning.
+    while(buffer>>w){ // read source sentence, word by word.
+      if (sent.eSent.size() < MAX_SENTENCE_LENGTH)
+        sent.eSent.push_back(w);
+      else {
+        if( PrintedTooLong++<100)
+          cerr << "{WARNING:(a)truncated sentence "<<pair_no<<"}";
+        break ;
+      }
+    }
+  }
+  else {
+    fail = true ;
+  }
+
+  // --- target sentence --------------------------------------------------
+  if (splits.size()>=3 ||getline(*inputFile, line)){
+    if(splits.size()>=3){
+      line = splits[2];
+    }
+    istrstream buffer(line.c_str());
+    WordIndex w;  // w is a local variable for the token id
+    sent.fSent.push_back(0); //0 is inserted for program uniformity
+    while(buffer>>w){ // read target sentence, word by word.
+      if (sent.fSent.size() < MAX_SENTENCE_LENGTH)
+        sent.fSent.push_back(w);
+      else {
+        if( PrintedTooLong++<100)
+          cerr << "{WARNING:(b)truncated sentence "<<pair_no<<"}";
+        break ;
+      }
+    }
+  }
+  else {
+    fail = true ;
+  }
+
+  // --- optional partial alignment ("e-f" pairs) ---------------------------
+  sent.eAnchor.clear();
+  sent.fAnchor.clear();
+  if(splits.size()>3){
+    vector<string> al,eal;
+    boost::algorithm::split(al,splits[3],boost::algorithm::is_any_of(" "));
+    for(size_t w = 0 ; w < al.size(); w++){
+      eal.clear();
+      boost::algorithm::split(eal,al[w],boost::algorithm::is_any_of("-"));
+      if(eal.size()==2){
+        const int ea = atoi(eal[0].c_str());
+        const int fa = atoi(eal[1].c_str());
+        // Skip positions that fall outside either sentence.
+        if(ea < 0 || fa < 0 ||
+           static_cast<size_t>(ea) >= sent.eSent.size() ||
+           static_cast<size_t>(fa) >= sent.fSent.size())
+          continue;
+        sent.eAnchor.push_back(ea);
+        sent.fAnchor.push_back(fa);
+      }
+    }
+  }
+
+  if (fail){
+    sent.eSent.clear();
+    sent.fSent.clear();
+    sent.eAnchor.clear();
+    sent.fAnchor.clear();
+    sent.sentenceNo = 0 ;
+    sent.noOcc = 0 ;
+    sent.realCount=0;
+    return(false);
+  }
+
+  // Number the pair before reporting on it, so that the message below names
+  // the real sentence number (it used to print 0 for every pair).
+  sent.sentenceNo = ++pair_no;
+  if( sent.eSent.size()==1||sent.fSent.size()==1 )
+    cerr << "ERROR: Forbidden zero sentence length " << sent.sentenceNo << endl;
+  if(pair_no % 100000 == 0) 
+    cout << "[sent:" << sent.sentenceNo  << "]"<< '\n';
+  return true;
+}
+
+// Grid search for lambda over 1.0, 1.33, 1.66, ... (strictly below
+// ManlexMAX_MULTIPLICITY). For each candidate the sum over all entries v of
+// vd of  v*exp(lambda*v)/(exp(lambda*v)-1)  is formed, and the first
+// candidate whose sum is closest to 1.0 wins.
+//   vd: the values entering the sum.
+// Returns the winning lambda, or 1.0 when the grid is empty.
+double optimize_lambda(Vector<double>&vd)
+{
+  int bestStep=0;        // grid index of the best candidate so far
+  double bestError=0.0;  // |sum-1| of that candidate
+  int step=0;
+  for(double lambda=1.0;lambda<ManlexMAX_MULTIPLICITY;lambda+=0.33,++step)
+    {
+      double prod=0.0;
+      for(unsigned int i=0;i<vd.size();++i)
+	{
+	  const double grown=exp(lambda*vd[i]);
+	  prod += vd[i]*grown/(grown-1.0);
+	}
+      const double error=fabs(prod-1.0);
+      // Strict comparison: on ties the earliest candidate is kept.
+      if( step==0 || error<bestError )
+	{
+	  bestError=error;
+	  bestStep=step;
+	}
+    }
+  double lam=double(bestStep)*0.33+1.0;
+  if( lam<1.0 )
+    {
+      cerr << "ERROR: lambda is smaller than one: " << lam << endl;
+      for(unsigned int i=0;i<vd.size();++i)
+	cerr << vd[i] << ' ';
+      cerr << endl;
+    }
+  return lam;
+}
+
+// Records exp(d) for sentence pair `s` when the pair has a non-positive
+// occurrence count, and does nothing at all when realCount is null.
+// Recorded pairs are collected in oldPairs/oldProbs. As soon as a pair
+// arrives whose source sentence differs from the last collected one, or
+// whose sentence number is not larger than it, the collected group is
+// evaluated: a lambda is fitted with optimize_lambda() and the realCount
+// entry of every collected pair is rewritten, then the group is emptied.
+// The work is done with setprob_mutex held.
+void sentenceHandler::setProbOfSentence(const sentPair&s,double d)
+{
+    if( realCount==0 )
+        return;
+
+    pthread_mutex_lock(&setprob_mutex);
+    if( s.noOcc<=0 )
+    {
+        const double ed=exp(d);
+
+        // Does `s` start a new group?
+        bool groupFinished=false;
+        if( oldPairs.size()>0 )
+        {
+            groupFinished = oldPairs.back().get_eSent()!=s.get_eSent()
+                         || oldPairs.back().getSentenceNo()>=s.getSentenceNo();
+        }
+
+        if( groupFinished )
+        {
+            const double lambda=optimize_lambda(oldProbs);
+            for(unsigned int i=0;i<oldPairs.size();++i)
+            {
+                const int slot=oldPairs[i].getSentenceNo()-1;
+                if( oldProbs[i]<1e-5 )
+                {
+                    (*realCount)[slot]=1.0;
+                }
+                else
+                {
+                    (*realCount)[slot]=lambda*oldProbs[i]/(1-exp(-lambda*oldProbs[i]));
+                }
+            }
+            oldPairs.clear();
+            oldProbs.clear();
+        }
+
+        oldPairs.push_back(s);
+        oldProbs.push_back(ed);
+    }
+    pthread_mutex_unlock(&setprob_mutex);
+}
+
+/* ------------- End of Method Definition of Class sentenceHandler ----------*/
+
+
+
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/getSentence.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/getSentence.h
@ -0,0 +1,136 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+/* --------------------------------------------------------------------------*
+ *                                                                           *
+ * Module : getSentence                                                      *
+ *                                                                           *
+ * Prototypes File: getSentence.h                                            *
+ *                                                                           *
+ * Objective: Defines classes and methods for handling I/O for the parallel  *
+ *            corpus.                                                        *
+ *****************************************************************************/
+
+
+
+
+
+#ifndef _sentenceHandler_h
+#define _sentenceHandler_h 1
+
+
+#include <iostream>
+#include <fstream>
+#include <string>
+#include <set>
+#include <cstdio>
+#include <cstdlib>
+#include <pthread.h>
+#include "Vector.h"
+#include "defs.h"
+#include "vocab.h"
+#include "Globals.h"
+/*----------------------- Class Prototype Definition ------------------------*
+ Class Name: sentenceHandler 
+ Objective: This class is defined to handle training sentence pairs from the 
+ parallel corpus. Each pair has: a target sentence, called here French; a 
+ source sentence, called here English; and a number denoting the number of
+ times this pair occurred in the training corpus. Both source and 
+ target sentences are represented as integer vectors (variable-size arrays); 
+ each entry is a numeric value which is the token id for the particular token
+ in the sentence.
+
+ *---------------------------------------------------------------------------*/
+
+// One sentence pair of the parallel corpus together with its counts.
+class sentPair{
+ public:
+  int sentenceNo ;            // sequential number of the pair; 0 after clear()
+  float noOcc;                // occurrence count as read from the corpus
+  float realCount;            // count used instead of noOcc where they differ
+  Vector<WordIndex> eSent ;   // source sentence as token ids
+  Vector<WordIndex> fSent;    // target sentence as token ids
+  Vector<WordIndex> eAnchor;  // source positions of the partial alignment
+  Vector<WordIndex> fAnchor;  // target positions of the partial alignment
+ public:
+  // A new pair starts out empty with all counters at zero, i.e. in the same
+  // state clear() produces (the scalars used to be left uninitialized).
+  sentPair():sentenceNo(0),noOcc(0),realCount(0){}
+  // Empties all four vectors and zeroes the counters.
+  void clear(){
+    eSent.clear();
+    fSent.clear();
+    eAnchor.clear();
+    fAnchor.clear();
+    noOcc=0;
+    realCount=0;
+    sentenceNo=0;
+  }
+  const Vector<WordIndex>&get_eSent()const
+    { return eSent; }
+  const Vector<WordIndex>&get_fSent()const
+    { return fSent; }
+  int getSentenceNo()const
+    { return sentenceNo; }
+  double getCount()const
+    { return realCount; }
+    
+};
+
+// Writes a sentence pair to `of`: a header line with the sentence number and
+// occurrence count, a second header line with the used count when it differs
+// from the occurrence count, then the source ids (from index 0) and the
+// target ids (from index 1), each list on its own line with a blank after
+// every id. Returns `of`.
+inline ostream&operator<<(ostream&of,const sentPair&s)
+{
+  of << "Sent No: " << s.sentenceNo << " , No. Occurrences: " << s.noOcc << '\n';
+
+  const bool countsDiffer = (s.noOcc!=s.realCount);
+  if( countsDiffer )
+    {
+      of << " Used No. Occurrences: " << s.realCount << '\n';
+    }
+
+  // Source side: every entry, including the one at index 0.
+  unsigned int e=0;
+  while( e < s.eSent.size() )
+    {
+      of << s.eSent[e] << ' ';
+      ++e;
+    }
+  of <<  '\n';
+
+  // Target side: the entry at index 0 is not printed.
+  unsigned int f=1;
+  while( f < s.fSent.size() )
+    {
+      of << s.fSent[f] << ' ';
+      ++f;
+    }
+  of << '\n';
+
+  return of;
+}
+
+/* Reader for the sentence pairs of a parallel corpus file.
+   getNextSentence() and setProbOfSentence() each run under their own
+   mutex; rewind() takes no lock. */
+class sentenceHandler{
+public:
+    const char * inputFilename;   // parallel corpus file name
+    ifstream *inputFile;     // parallel corpus file stream
+    Vector<sentPair> Buffer;      // sentence pairs currently held in memory
+    int noSentInBuffer ;          // number of pairs in Buffer
+    int currentSentence ;         // index in Buffer of the next pair to hand out
+    int position; /*Sentence position (will be returned)*/
+    int totalPairs1 ;             // number of pairs counted by the constructor
+    double totalPairs2;           // sum of the pairs' real counts
+    bool readflag ; // true if you reach the end of file
+    bool allInMemory ;            // true when Buffer holds the whole corpus
+    int pair_no ;                 // number of pairs read from the file so far
+    Vector<double> *realCount;    // per-pair real counts; null unless the
+                                  // corpus has negative occurrence counts
+  
+    Vector<sentPair> oldPairs;    // pairs collected by setProbOfSentence()
+    Vector<double> oldProbs;      // exp(d) values collected with them
+
+    // Creates a handler that is not attached to any corpus: pointers are
+    // null, counters zero, flags false and both mutexes initialised. (These
+    // members used to be left uninitialized.) Such an object has no input
+    // file; it must be assigned from a properly constructed handler before
+    // sentences are read from it.
+    sentenceHandler()
+        : inputFilename(0), inputFile(0), noSentInBuffer(0),
+          currentSentence(0), position(0), totalPairs1(0), totalPairs2(0),
+          readflag(false), allInMemory(false), pair_no(0), realCount(0)
+    {
+        pthread_mutex_init(&readsent_mutex,NULL);
+        pthread_mutex_init(&setprob_mutex,NULL);
+    }
+    sentenceHandler(const char* filename, vcbList* elist=0, vcbList* flist=0);
+    sentenceHandler(const char* filename, vcbList* elist, vcbList* flist,set<WordIndex>& eapp, set<WordIndex>& fapp);
+    void rewind();
+    // Reads the next pair of sentences from the memory buffer; defined in
+    // the definition file.
+    int getNextSentence(sentPair&, vcbList* = 0, vcbList* = 0);
+    int getTotalNoPairs1()const {return totalPairs1;}
+    double getTotalNoPairs2()const {return totalPairs2;}
+    void setProbOfSentence(const sentPair&s,double d);
+private:    
+    pthread_mutex_t readsent_mutex; 
+    pthread_mutex_t setprob_mutex;
+    // Reads one pair from the corpus file; defined in the definition file.
+    bool readNextSentence(sentPair&);
+};
+
+#endif
+  
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/hmm.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/hmm.cpp
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/hmm.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/hmm.h
@ -0,0 +1,103 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef _hmm_h
+#define _hmm_h 1
+
+#include <cassert>
+ 
+#include <iostream>
+#include <algorithm>
+#include <functional>
+#include <map>
+#include <set>
+#include "Vector.h"
+#include <utility>
+
+#if __GNUC__>2
+#include <ext/hash_map>
+using __gnu_cxx::hash_map;
+#else
+#include <hash_map>
+#endif
+#include <fstream>
+#include <cmath>
+#include <ctime>
+
+#include "TTables.h"
+#include "ATables.h" 
+#include "getSentence.h"
+#include "defs.h"
+#include "model2.h"
+#include "Perplexity.h"
+#include "vocab.h"
+#include "WordClasses.h"
+#include "HMMTables.h"
+#include "ForwardBackward.h"
+#include "ttableDiff.hpp"
+
+// HMM alignment model, derived from model2. It refers to the source and
+// target word classes it is given and keeps two HMMTables, one named counts
+// and one named probs.
+class hmm : public model2{
+public:
+    WordClasses& ewordclasses;
+    WordClasses& fwordclasses;
+    HMMTables<int,WordClasses> counts,probs;
+
+    // Reads the source word classes from `efile` and the target word classes
+    // from `ffile`, using the mappers m1 and m2 respectively. A file that
+    // cannot be read is reported on cerr and skipped.
+    template<class MAPPER>
+    void makeWordClasses(const MAPPER&m1,const MAPPER&m2,string efile,string ffile){
+        ifstream estrm(efile.c_str());
+        ifstream fstrm(ffile.c_str());
+        if( estrm ) {
+            ewordclasses.read(estrm,m1,Elist);
+        } else {
+            cerr << "ERROR: can not read " << efile << endl;
+        }
+        if( fstrm ) {
+            fwordclasses.read(fstrm,m2,Flist);
+        } else {
+            cerr << "ERROR: can not read " << ffile << endl;
+        }
+    }
+
+    hmm(model2&m2,WordClasses &e, WordClasses& f);
+    void initialize_table_uniformly(sentenceHandler&);
+    int em_with_tricks(int iterations, bool dumpCount = false, 
+	    const char* dumpCountName = NULL, bool useString = false,bool resume=false);
+    CTTableDiff<COUNT,PROB>* em_one_step(int it);
+   // void em_one_step_2(int it,int part);
+    void load_table(const char* aname);
+
+   // Earlier variants of em_loop, kept for reference:
+   // void em_loop(Perplexity& perp, sentenceHandler& sHandler1, bool dump_files, 
+     //            const char* alignfile, Perplexity&, bool test,bool doInit,int iter);
+   /* CTTableDiff<COUNT,PROB>* em_loop_1(Perplexity& perp, sentenceHandler& sHandler1, bool dump_files, 
+                 const char* alignfile, Perplexity&, bool test,bool doInit,int iter);*/
+   /* void em_loop_2(    Perplexity& perp, sentenceHandler& sHandler1, 
+		  bool dump_alignment, const char* alignfile, Perplexity& viterbi_perp, 
+	     bool test,bool doInit,int part);*/
+    void em_loop(Perplexity& perp, sentenceHandler& sHandler1, 
+                 bool dump_alignment, const char* alignfile, Perplexity& viterbi_perp, 
+                 bool test,bool doInit,int 
+                 );
+    void em_thread(int it,string alignfile,bool dump_files,bool resume=false);
+    HMMNetwork *makeHMMNetwork(const Vector<WordIndex>& es,const Vector<WordIndex>&fs,bool doInit)const;
+	void clearCountTable();
+    friend class model3;
+};
+//int multi_thread_em(int noIter, int noThread, hmm* base);
+
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/hmmnorm.cxx
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/hmmnorm.cxx
@ -0,0 +1,135 @@
+// HMM Normalization executable
+
+#include <iostream>
+#include <strstream>
+#include <string>
+#include "hmm.h"
+#include "Parameter.h"
+#define ITER_M2 0 // value passed as the last argument of the Model2_Iterations parameter below
+#define ITER_MH 5 // value passed as the last argument of the HMM_Iterations parameter below
+GLOBAL_PARAMETER3(int,Model1_Iterations,"Model1_Iterations","NO. ITERATIONS MODEL 1","m1","number of iterations for Model 1",PARLEV_ITER,5);
+GLOBAL_PARAMETER3(int,Model2_Iterations,"Model2_Iterations","NO. ITERATIONS MODEL 2","m2","number of iterations for Model 2",PARLEV_ITER,ITER_M2);
+GLOBAL_PARAMETER3(int,HMM_Iterations,"HMM_Iterations","mh","number of iterations for HMM alignment model","mh", PARLEV_ITER,ITER_MH); // NOTE(review): "mh" and the description sit in different argument positions than on the sibling Model*_Iterations lines - confirm against the GLOBAL_PARAMETER3 definition
+GLOBAL_PARAMETER3(int,Model3_Iterations,"Model3_Iterations","NO. ITERATIONS MODEL 3","m3","number of iterations for Model 3",PARLEV_ITER,5);
+GLOBAL_PARAMETER3(int,Model4_Iterations,"Model4_Iterations","NO. ITERATIONS MODEL 4","m4","number of iterations for Model 4",PARLEV_ITER,5);
+GLOBAL_PARAMETER3(int,Model5_Iterations,"Model5_Iterations","NO. ITERATIONS MODEL 5","m5","number of iterations for Model 5",PARLEV_ITER,0);
+GLOBAL_PARAMETER3(int,Model6_Iterations,"Model6_Iterations","NO. ITERATIONS MODEL 6","m6","number of iterations for Model 6",PARLEV_ITER,0);
+
+GLOBAL_PARAMETER(float, PROB_SMOOTH,"probSmooth","probability smoothing (floor) value ",PARLEV_OPTHEUR,1e-7);
+GLOBAL_PARAMETER(float, MINCOUNTINCREASE,"minCountIncrease","minimal count increase",PARLEV_OPTHEUR,1e-7);
+
+GLOBAL_PARAMETER2(int,Transfer_Dump_Freq,"TRANSFER DUMP FREQUENCY","t2to3","output: dump of transfer from Model 2 to 3",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER2(bool,Verbose,"verbose","v","0: not verbose; 1: verbose",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER(bool,Log,"log","0: no logfile; 1: logfile",PARLEV_OUTPUT,0);
+
+GLOBAL_PARAMETER(double,P0,"p0","fixed value for parameter p_0 in IBM-3/4 (if negative then it is determined in training)",PARLEV_EM,-1.0);
+GLOBAL_PARAMETER(double,M5P0,"m5p0","fixed value for parameter p_0 in IBM-5 (if negative then it is determined in training)",PARLEV_EM,-1.0);
+GLOBAL_PARAMETER3(bool,Peg,"pegging","p","DO PEGGING? (Y/N)","0: no pegging; 1: do pegging",PARLEV_EM,0);
+
+GLOBAL_PARAMETER(short,OldADBACKOFF,"adbackoff","",-1,0); // NOTE(review): empty description and a literal -1 where the sibling lines pass a PARLEV_* constant - confirm intent
+GLOBAL_PARAMETER2(unsigned int,MAX_SENTENCE_LENGTH,"ml","MAX SENTENCE LENGTH","maximum sentence length",0,MAX_SENTENCE_LENGTH_ALLOWED); // NOTE(review): literal 0 where the sibling lines pass a PARLEV_* constant; MAX_SENTENCE_LENGTH_ALLOWED is defined outside this file section
+
+GLOBAL_PARAMETER(short, DeficientDistortionForEmptyWord,"DeficientDistortionForEmptyWord","0: IBM-3/IBM-4 as described in (Brown et al. 1993); 1: distortion model of empty word is deficient; 2: distoriton model of empty word is deficient (differently); setting this parameter also helps to avoid that during IBM-3 and IBM-4 training too many words are aligned with the empty word",PARLEV_MODELS,0); // NOTE(review): the help text contains the typo "distoriton"; it is a runtime string and is therefore left untouched here
+
+/**
+The following parameters support loading models and dumping models.
+*/
+
+GLOBAL_PARAMETER(int,restart,"restart","Restart training from a level,0: Normal restart, from model 1, 1: Model 1, 2: Model 2 Init (Using Model 1 model input and train model 2), 3: Model 2, (using model 2 input and train model 2), 4 : HMM Init (Using Model 1 model and train HMM), 5: HMM (Using Model 2 model and train HMM) 6 : HMM (Using HMM Model and train HMM), 7: Model 3 Init (Use HMM model and train model 3) 8: Model 3 Init (Use Model 2 model and train model 3) 9: Model 3, 10: Model 4 Init (Use Model 3 model and train Model 4) 11: Model 4 and on, ",PARLEV_INPUT,0);
+GLOBAL_PARAMETER(bool,dumpCount,"dumpcount","Whether we are going to dump count (in addition to) final output?",PARLEV_OUTPUT,false);
+GLOBAL_PARAMETER(bool,dumpCountUsingWordString,"dumpcountusingwordstring","In count table, should actual word appears or just the id? default is id",PARLEV_OUTPUT,false);
+/// END of the load/dump parameters
+short OutputInAachenFormat=0;
+bool Transfer=TRANSFER; // TRANSFER is defined outside this file section
+bool Transfer2to3=0;
+short NoEmptyWord=0;
+bool FEWDUMPS=0;
+GLOBAL_PARAMETER(bool,ONLYALDUMPS,"ONLYALDUMPS","1: do not write any files",PARLEV_OUTPUT,0); // NOTE(review): description is identical to the one of NODUMPS below - possibly a copy/paste slip, confirm
+GLOBAL_PARAMETER(short,NCPUS,"NCPUS","Number of CPUS",PARLEV_EM,2);
+GLOBAL_PARAMETER(short,CompactAlignmentFormat,"CompactAlignmentFormat","0: detailled alignment format, 1: compact alignment format ",PARLEV_OUTPUT,0);
+GLOBAL_PARAMETER2(bool,NODUMPS,"NODUMPS","NO FILE DUMPS? (Y/N)","1: do not write any files",PARLEV_OUTPUT,0);
+
+GLOBAL_PARAMETER(WordIndex, MAX_FERTILITY, "MAX_FERTILITY",
+		"maximal fertility for fertility models", PARLEV_EM, 10);
+
+using namespace std;
+string Prefix, LogFilename, OPath, Usage, SourceVocabFilename,
+		TargetVocabFilename, CorpusFilename, TestCorpusFilename, t_Filename,
+		a_Filename, p0_Filename, d_Filename, n_Filename, dictionary_Filename; // file-name globals; main() in this file assigns SourceVocabFilename and TargetVocabFilename and reads CorpusFilename, which is never assigned in this file
+
+
+// Entry point of the HMM normalization executable.
+//
+// Usage: <prog> vcb1 vcb2 outputFile baseFile [additional1 ]...
+//   vcb1, vcb2   vocabulary files; "<vcb>.classes" is passed to
+//                makeWordClasses() for each of them
+//   outputFile   name the merged jump table is written to (together with
+//                "<outputFile>.alpha" and "<outputFile>.beta")
+//   baseFile     jump table read into h.probs (with ".alpha"/".beta")
+//   additional*  further tables; each one is read into h.counts, merged
+//                into h.probs, and the count table is cleared afterwards
+//
+// Returns 1 when too few arguments are given, 0 otherwise.  A table that
+// cannot be read is reported on cerr and skipped.
+int main(int argc, char* argv[]){
+	if(argc < 5){
+		cerr << "Usage: " << argv[0] << " vcb1 vcb2 outputFile baseFile [additional1 ]..." << endl;
+		return 1;
+	}
+
+	// Vocabularies.
+	Vector<WordEntry> evlist,fvlist;
+	vcbList eTrainVcbList(evlist), fTrainVcbList(fvlist);
+	TargetVocabFilename = argv[2];
+	SourceVocabFilename = argv[1];
+	eTrainVcbList.setName(argv[1]);
+	fTrainVcbList.setName(argv[2]);
+	eTrainVcbList.readVocabList();
+	fTrainVcbList.readVocabList();
+
+	// Model chain model1 -> model2 -> hmm.  CorpusFilename is never assigned
+	// in this file, so model1 receives an empty corpus name here.
+	Perplexity trainPerp, testPerp, trainViterbiPerp, testViterbiPerp;
+	tmodel<float, float> tTable;
+	sentenceHandler *corpus = new sentenceHandler();
+
+	model1 m1(CorpusFilename.c_str(), eTrainVcbList, fTrainVcbList, tTable,
+		trainPerp, *corpus, &testPerp, corpus, trainViterbiPerp,
+		&testViterbiPerp);
+	amodel<float> aTable(false);
+	amodel<float> aCountTable(false);
+	model2 m2(m1, aTable, aCountTable);
+	WordClasses french,english;
+	hmm h(m2,english,french);
+
+	// Word classes live next to the vocabulary files.
+	string evcbcls = argv[1];
+	string fvcbcls = argv[2];
+	evcbcls += ".classes";
+	fvcbcls += ".classes";
+	h.makeWordClasses(m1.Elist, m1.Flist, evcbcls.c_str(), fvcbcls.c_str());
+
+	// Load the base table into the probability table.
+	string base = argv[4];
+	string baseA = base+".alpha";
+	string baseB = base+".beta";
+	string output = argv[3];
+	string outputA = output+".alpha";
+	string  outputB = output+".beta";
+	h.probs.readJumps(base.c_str(),NULL,baseA.c_str(), baseB.c_str());
+
+	// Merge every additional table into the base table.
+	for(int i = 5; i< argc ; i++){
+		string name = argv[i];
+		string nameA = name + ".alpha";
+		string nameB = name + ".beta";
+		if(h.counts.readJumps(name.c_str(),NULL,nameA.c_str(), nameB.c_str()))
+			h.probs.merge(h.counts);
+		else
+			// The original printed the literal text "name.c_str()" here;
+			// report the actual file name instead.
+			cerr << "Error, cannot load " << name << endl;
+		h.clearCountTable();
+	}
+	h.probs.writeJumps(output.c_str(),NULL,outputA.c_str(), outputB.c_str());
+	delete corpus;
+	return 0;
+}
+
+// Some utility definitions that are only needed to get this executable to compile and link.
+
+ofstream logmsg; // log stream object; it is defined here but never opened or written in this file
+// Returns the decimal representation of n as a string (despite its name the
+// function converts a number to a string).
+// Negative values get a leading '-'.  The original loop was only correct for
+// n >= 0: for a negative n, "n % 10" is negative, so a single non-digit
+// character was produced.
+const string str2Num(int n) {
+	const bool negative = n < 0;
+	// Work on the magnitude as an unsigned value so that even the most
+	// negative int is representable and '%' never sees a negative operand.
+	unsigned int magnitude = negative ? 0u - (unsigned int)n : (unsigned int)n;
+	string number = "";
+	do {
+		number.insert((size_t)0, 1, (char)(magnitude % 10 + '0'));
+	} while ((magnitude /= 10) > 0);
+	if (negative)
+		number.insert((size_t)0, 1, '-');
+	return (number);
+}
+double LAMBDA=1.09; // not referenced anywhere else in this file; presumably required by other linked objects - confirm
+
+Vector<map< pair<int,int>,char > > ReferenceAlignment; // one map per entry, keyed by an (int,int) pair; left empty by this file
+
+// Stub that belongs to the "utility functions" this executable only defines
+// so that it builds.  It performs no evaluation: none of the reference
+// parameters is modified and the result is always 0.
+double ErrorsInAlignment(const map< pair<int,int>,char >&reference,
+		const Vector<WordIndex>&test, int l, int&missing, int&toomuch,
+		int&eventsMissing, int&eventsToomuch, int pair_no){
+	// The original body was empty, i.e. a value-returning function flowed off
+	// its end, which is undefined behaviour.  Return a defined value.
+	return 0.0;
+}
+
+void printGIZAPars(ostream&out){ // empty stub: nothing is written to `out`
+}
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/logprob.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/logprob.cpp
@ -0,0 +1,154 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+//  Routines to perform integer exponential arithmetic.
+//  A number x is represented as n, where x = b**n.
+//  It is assumed that b > 1, something like b = 1.001;
+
+#include "logprob.h"
+#include <cstdlib>
+#include <cstdio>
+#include <iostream>
+#include <fstream>
+#include <string>
+double *LogProb::ntof  = NULL; // Tables will be initialized
+int   *LogProb::addtbl = NULL; // in Initialize function.
+int   *LogProb::subtbl = NULL; //
+
+const int    LogProb::max_2byte_integer =  32767; // largest 16-bit signed value
+const int    LogProb::min_2byte_integer = -32768; // smallest 16-bit signed value
+const double LogProb::b      = 1.001;   // a logarithm basis
+const double LogProb::logb2  = log(b); // natural logarithm of b (not a base-2 logarithm, despite the name)
+//const int    LogProb::nmax   = round(78.0E0 * log(1.0E1) / logb2);
+const int    LogProb::nmax   = round(300.0E0 * log(1.0E1) / logb2); // exponent n with b**n == 1e300 (rounded); upper end of the ntof table
+const int    LogProb::nmin   = -nmax; // lower end of the ntof table
+const int    LogProb::tblbnd = round(log((b-1.0E0)/2.0E0)/logb2); // negative bound; addtbl and subtbl each hold -tblbnd+1 entries
+const int    LogProb::zeron  = round(pow(-2, 23)); // -2**23: exponent reserved for the value zero
+const int    LogProb::onen   = 0; // b**0 == 1
+const int    LogProb::infn   = onen - zeron; // +2**23: exponent used for "infinity"
+
+const int LogProb::initialized = LogProb::Initialize(); // builds the tables during static initialization; the constants above are defined earlier in this translation unit
+const LogProb LogProb::zero(0); // LogProb(double) maps 0 to zeron
+const LogProb LogProb::one(1);
+const LogProb LogProb::minus2(1e-2);
+const LogProb LogProb::minus4(1e-4);
+const LogProb LogProb::minus6(1e-6);
+const LogProb LogProb::minus8(1e-8);
+const LogProb LogProb::minus10(1e-10);
+const LogProb LogProb::minus12(1e-12);
+const LogProb LogProb::minus14(1e-14);
+const LogProb LogProb::minus16(1e-16);
+
+// Static table initialization function.
+//
+// Allocates and fills the three lookup tables used by LogProb:
+//   ntof   : ntof[n-nmin] == b**n for n in (nmin, nmax]; slot 0 is set to 0,
+//            which is what operator double() returns for exponents <= nmin
+//   addtbl : addtbl[d-tblbnd] == round(log_b(1 + b**d)) for d in [tblbnd, 0]
+//   subtbl : subtbl[d] == round(log_b(sqrt(b) * b**d - 1)) for d in [0, -tblbnd]
+// A short report is written to std::cerr.  Always returns 1; the value is
+// stored in the static member `initialized`.
+int LogProb::Initialize()
+{
+  const int ntofEntries = nmax-nmin+1;
+  const int tblEntries  = 0-tblbnd+1;
+  // addtbl and subtbl have the same size; the original report counted only
+  // one of the two int tables.
+  int nbytes = sizeof(double)*ntofEntries + 2*sizeof(int)*tblEntries;
+  std::cerr << nbytes << " bytes used for LogProb tables (C++ version)\n";
+  ntof   = new double[ntofEntries];
+  addtbl = new int[tblEntries];
+  subtbl = new int[tblEntries];
+
+  // Disabled code that once loaded the tables from a file:
+  //  char filename[257];
+  //  string filename ;
+  //  ifstream ifs;
+  //  ifs.open(filename.c_str());
+  //  if (!ifs)
+  //    {
+  int i;
+  std::cerr << "Building integer logs conversion tables\n";
+  ntof[0] = 0 ;
+
+  // exponent -> linear value
+  for (i=nmin+1; i<=nmax; ++i)
+    {
+      double x = i;
+      ntof[i-nmin] = exp(x*logb2);
+    }
+  // correction term for additions, indexed by the (non-positive) exponent gap
+  for (i=tblbnd; i<=0; ++i)
+    {
+      double x = 1.0 + pow(b, i);
+      addtbl[i-tblbnd] = round(log(x)/logb2);
+    }
+  // correction term for subtractions, indexed by the (non-negative) exponent gap
+  double sqrtb = exp(0.5*logb2);
+  for (i=0; i<=-tblbnd; ++i)
+    {
+      double x = sqrtb * pow(b, i) - 1.0;
+      subtbl[i] = round(log(x)/logb2);
+    }
+  // Disabled code that once wrote the tables to / read them from a file:
+  //      if (toolsRoot)
+  //	{
+  //      ofstream ofs(filename.c_str());
+  //      if (!ofs)
+  //	cerr << "Could not write LogProb data to " << filename << endl;
+  //      else
+  //	{
+  //	  ofs.write((const char *)ntof, sizeof(double) * (nmax-nmin+1));
+  //	  ofs.write((const char *)addtbl, sizeof(int) * (-tblbnd+1));
+  //	  ofs.write((const char *)subtbl, sizeof(int) * (-tblbnd+1));
+  //	}
+  //    }
+  //    }
+  //  else
+  //    {
+  //      ifs.read((char *)ntof,   sizeof(double) * (nmax - nmin + 1));
+  //      ifs.read((char *)addtbl, sizeof(int) * (-tblbnd+1));
+  //      ifs.read((char *)subtbl, sizeof(int) * (-tblbnd+1));
+  //    }
+  return 1;
+}
+
+// Releases the lookup tables allocated by Initialize().
+// The pointers are reset afterwards so that a second call is harmless
+// (delete [] on a null pointer does nothing); the original left them
+// dangling, which made a repeated call a double free.
+// Conversions to double and += / -= read these tables and must not be used
+// after this call.
+void LogProb::FreeTables()
+{
+   delete [] addtbl;
+   addtbl = NULL;
+   delete [] subtbl;
+   subtbl = NULL;
+   delete [] ntof;
+   ntof = NULL;
+}
+
+//---------------------------------------------------------------------------
+//            Arithmetic operators
+//---------------------------------------------------------------------------
+
+
+// Log-domain subtraction.  With *this == b**n and subs == b**m the result is
+//   b**n - b**m = b**m * ( b**(n-m) - 1 ),   n >= m,
+// where the logarithm of the bracketed factor is taken from subtbl.
+//  - subs == 0            : *this is left unchanged
+//  - n == m               : result is zero
+//  - n <  m               : a warning is printed and the result is zero
+//  - n - m above -tblbnd  : subs is too small to matter, *this is unchanged
+LogProb& LogProb::operator-=(const LogProb &subs) 
+{
+  if (subs.logr != zeron)
+    {
+      const int gap = logr - subs.logr;
+      if (gap < 0)
+	std::cerr << "WARNING(logprob): Invalid arguments to nsub" <<(*this)<< " " << subs << std::endl;
+      if (gap <= 0)
+	logr = zeron;
+      else if (gap <= -tblbnd)
+	logr = subs.logr + subtbl[gap];
+    }
+  return *this;
+}
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/logprob.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/logprob.h
@ -0,0 +1,217 @@
+/*
+
+EGYPT Toolkit for Statistical Machine Translation
+Written by Yaser Al-Onaizan, Jan Curin, Michael Jahr, Kevin Knight, John Lafferty, Dan Melamed, David Purdy, Franz Och, Noah Smith, and David Yarowsky.
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+#ifndef _LOGPROB_H
+#define _LOGPROB_H
+
+// Routines to perform integer exponential arithmetic.
+// A number x is represented as n, where x = b**n
+// It is assumed that b > 1, something like b = 1.001
+
+#include <iostream>
+#include <cmath>
+#include <algorithm>
+
+//#define  MAX(A,B) ((A) > (B) ? (A) : (B))
+//#define  MIN(A,B) ((A) > (B) ? (B) : (A))
+
+
+// A non-negative real number stored as an integer exponent: the value x is
+// represented by logr with x = b**logr.  The value zero is represented by the
+// reserved exponent `zeron`.  Conversion to double, += and -= use lookup
+// tables (ntof, addtbl, subtbl) that are built by Initialize().
+class LogProb {
+public:
+  // mj for cross entropy: the represented value as a base-2 logarithm
+  double base2() const {
+    return (logr * logb2 / log(2));
+  }
+  
+  // Constructors
+  LogProb() : logr(zeron) {}                        // zero
+  LogProb(const LogProb &obj) : logr(obj.logr) {}
+  // From a linear-domain value; 0.0 maps to the zero representation.
+  // NOTE(review): x is presumably expected to be >= 0 (the logarithm of a
+  // negative number is not a real value) - confirm with callers.
+  LogProb(double x) : logr(x == 0.0 ? zeron : round(log(x)/logb2)) {}
+  // destructor
+  ~LogProb() {}                  // default destructor
+
+  // converts logr to (double) b**logr; exponents outside [nmin, nmax] are
+  // clamped to the first / last table entry
+  operator double() const
+    {
+      if (logr < nmin) return ntof[0];
+      if (logr > nmax) return ntof[nmax-nmin];
+      return ntof[logr-nmin];
+    }
+
+  LogProb &operator=(const LogProb &obj) { logr = obj.logr; return *this; }
+  // non-zero exactly when this object holds the zero representation
+  int operator!() const { return logr == zeron; }
+  
+  // iostream friend specifications
+  friend std::ostream& operator<<(std::ostream& os, const LogProb &obj);
+  friend std::istream& operator>>(std::istream& is, LogProb &obj);
+  friend std::ostream& operator<<=(std::ostream& os, const LogProb &obj);
+  friend std::istream& operator>>=(std::istream& is, LogProb &obj);
+
+  // arithmetic operators 
+  LogProb &operator+=(const LogProb &add)   // logr2 = logb ( b**logr2 + b**logr1 )
+    // Add two numbers represented as logarithms. Use the following method:
+    //   b**n + b**m = b**n(1 + b**(m-n)), assuming n >= m.
+    {
+      if (add.logr == zeron)
+	return *this;
+      if (logr == zeron)
+	{
+	  logr = add.logr;
+	  return *this;
+	}
+      // a becomes the non-positive gap "smaller exponent - larger exponent";
+      // logr becomes the larger exponent.
+      int a = add.logr - logr;
+      if (a > 0)
+	{
+	  a = -a;
+	  logr = add.logr;
+	}
+      // below the table bound the smaller operand is ignored
+      if (a < tblbnd)
+	return *this;
+      logr += addtbl[a-tblbnd];
+      return *this;
+    }
+
+  LogProb &operator-=(const LogProb &);   // logr2 = logb ( b**logr2 - b**logr1 )
+  LogProb operator*(const LogProb &mul) const  // logr3 = logr2 + logr1
+    {
+      LogProb result;		// start out with result == 0
+      if ((logr != zeron) && (mul.logr != zeron))
+	result.logr = std::max(logr+mul.logr, zeron);
+      return result;
+    }
+  LogProb operator*(double x) const  // logr3 = logr2 + logr1
+    {
+      return (*this)*(LogProb)x;
+    }
+  LogProb operator^(const int i) const  // logr2 = logr1 * i
+    {
+      return power(i);
+    }
+  LogProb &operator*=(const LogProb &mul) // logr2 += logr1
+    { 
+      if ((logr == zeron) || (mul.logr == zeron))
+	logr = zeron;
+      else
+	logr = std::max(logr+mul.logr, zeron);
+      return *this;
+    }
+  // NOTE(review): a zero divisor is not checked here or in operator/=.
+  LogProb operator/(const LogProb &div) const  // logr3 = logr2 -logr1
+    {
+      LogProb result;
+      if (logr != zeron)
+	result.logr = std::max(logr - div.logr, zeron);
+      return result;
+    }
+  LogProb &operator/=(const LogProb &div) // logr2 -= logr1
+    {
+      if (logr != zeron)
+	logr = std::max(logr - div.logr, zeron);
+      return *this;
+    }
+  LogProb operator+(const LogProb &l) const // logr3 = logb ( b**logr2 + b**logr1 )
+    { LogProb result(*this); result += l; return result; }
+  LogProb operator-(const LogProb &l) const // logr3 = logb ( b**logr2 - b**logr1 )
+    { LogProb result(*this); result -= l; return result; }
+  // Integer power: logr2 = logr1 * n.
+  // Zero raised to a positive power stays the canonical zero (the original
+  // multiplied the reserved exponent zeron by n, which left the zero
+  // representation and could overflow), and the result is clamped at zeron
+  // like in operator*.  For n == 0 the result is one, as before.
+  LogProb power(const int n) const
+    {
+      LogProb result;		// start out with result == 0
+      if ((logr != zeron) || (n <= 0))
+	result.logr = std::max(logr * n, zeron);
+      return result;
+    }
+  
+  // Conditional operators
+  // comparisons between two LogProbs compare the exponents ...
+  int operator<(const LogProb &obj)  const { return logr <  obj.logr; }
+  int operator<=(const LogProb &obj) const { return logr <= obj.logr; }
+  int operator>(const LogProb &obj)  const { return logr >  obj.logr; }
+  int operator>=(const LogProb &obj) const { return logr >= obj.logr; }
+  int operator==(const LogProb &obj) const { return logr == obj.logr; }
+  int operator!=(const LogProb &obj) const { return logr != obj.logr; }
+  // ... comparisons with a double convert this object to double first
+  int operator<(double d)  const { return ((double)*this) < d;  }
+  int operator<=(double d) const { return ((double)*this) <= d; }
+  int operator>(double d)  const { return ((double)*this) >  d; }
+  int operator>=(double d) const { return ((double)*this) >= d; }
+  int operator==(double d) const { return ((double)*this) == d; }
+  int operator!=(double d) const { return ((double)*this) != d; }
+  
+
+  LogProb &SetZero() { logr = zeron; return *this; } // representation of 0,
+  LogProb &SetOne() { logr = onen; return *this; }   // 1, and
+  LogProb &SetInf() { logr = infn; return *this; }   // inf in logarithm domain 
+
+private:
+  int logr;			// a representation of logarithm
+  // static constants
+  static const  int    initialized; // initialization flag
+  static const  double b;
+  static const  double logb2;
+  static const  int    nmin, nmax;
+  static const  int    tblbnd;
+  static const  int    zeron, onen, infn;  // zero, one, and inf in log domain
+  static const  int    max_2byte_integer, min_2byte_integer;
+  
+  // Arithmetic computation Tables
+  static double *ntof;
+  static int   *addtbl;
+  static int   *subtbl;
+
+  static int Initialize();
+
+public:
+  static void FreeTables();
+  // constants for initializing LogProbs to 0 or 1
+  static const LogProb zero;
+  static const LogProb one;
+  static const LogProb minus2;
+  static const LogProb minus4;
+  static const LogProb minus6;
+  static const LogProb minus8;
+  static const LogProb minus10;
+  static const LogProb minus12;
+  static const LogProb minus14;
+  static const LogProb minus16;
+};
+
+// iostream friend operators
+// Text output: writes the value in the linear domain, i.e. b**logr.
+inline std::ostream &operator<<(std::ostream& os, const LogProb &obj)
+{
+  const double linear = (double) obj;
+  os << linear;
+  return os;
+}
+
+// Text input: reads a linear-domain double and converts it to a LogProb.
+// If the extraction fails, obj is left unchanged and the stream carries the
+// failure state (the original converted the possibly uninitialized local).
+inline std::istream &operator>>(std::istream& is, LogProb &obj)
+{
+  double d = 0.0;
+  if (is >> d)
+    obj = d;
+  return is;
+}
+
+// Binary output: writes the raw bytes of the integer exponent logr.
+inline std::ostream &operator<<=(std::ostream& os, const LogProb &obj) // write binary
+{
+  const char *const rawBytes = (const char *)&obj.logr;
+  os.write(rawBytes, sizeof(obj.logr));
+  return os;
+}
+
+// Binary input: reads the raw bytes of the integer exponent logr.
+inline std::istream &operator>>=(std::istream& is, LogProb &obj)
+{
+  char *const rawBytes = (char *)&obj.logr;
+  is.read(rawBytes, sizeof(obj.logr));
+  return is;
+}
+
+#endif
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/main.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/main.cpp
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/Array.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/Array.h
@ -0,0 +1,370 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+#ifndef ARRAY_H_DEFINED
+#define ARRAY_H_DEFINED
+using namespace std;
+#include "myassert.h"
+#include <algorithm>
+#include <string>
+#include <utility>
+#include <functional>
+#include "my.h"
+
+#define ARRAY_DEBUG
+
+
+// Growable, bounds-checked array of T.
+//
+// realSize is the number of allocated slots, maxWritten the highest valid
+// index (size() == maxWritten+1).  When the autoexpand flag `a` is set, a
+// write through operator[] at index size() grows the array by one element.
+// Every other out-of-range access ends in errorAccess().
+template<class T> class Array
+{
+ private:
+  T *p;                  	// element storage, released with delete []
+  int realSize;			// allocated capacity
+  int maxWritten;		// highest accessible index, -1 when empty
+  char a;			// autoexpand flag
+
+  void copy(T *a,const T *b,int n);
+  void copy(T *a,T *b,int n);
+  void _expand();
+		
+ public:
+  // Empty array with autoexpand switched on.
+  Array() 
+    : p(0),realSize(0),maxWritten(-1) ,a(1)
+    {
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY: " << this<<" "<<(void*)p << endl;
+#endif
+    }
+  // Copies the accessible elements of x; the capacity shrinks to x.size().
+  Array(const Array<T> &x)
+    : p(new T[x.maxWritten+1]),realSize(x.maxWritten+1),maxWritten(x.maxWritten),a(x.a)
+    {
+      copy(p,x.p,realSize);
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY copy: " << this << " " << realSize <<" "<<(void*)p<< endl;
+#endif
+    }
+  // n default-constructed elements, autoexpand off.
+  explicit Array(int n)
+    : p(new T[n]),realSize(n),maxWritten(n-1),a(0)
+    {
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY with parameter n: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+    }
+  // n copies of _init; _a sets the autoexpand flag.
+  Array(int n,const T&_init,int _a=0)
+    : p(new T[n]),realSize(n),maxWritten(n-1),a(_a)
+    {
+      for(int iii=0;iii<n;iii++)p[iii]=_init;
+#ifdef VERY_ARRAY_DEBUG
+      cout << "MAKE ARRAY with parameter n and init: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+    }
+  
+  ~Array() 
+    { 
+#ifdef VERY_ARRAY_DEBUG
+      cout << "FREE ARRAY: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+      delete [] p;
+    }
+  
+  // Copy assignment.  The new storage is allocated and filled before the old
+  // one is released, so this object stays intact if the allocation throws.
+  Array<T>& operator=(const Array<T>&x)
+    {
+      if( this!= &x )
+	{
+#ifdef VERY_ARRAY_DEBUG
+	  cout << "FREE ARRAY because of operator=: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+	  const int newSize = x.maxWritten+1;
+	  T *fresh = new T[newSize];
+	  copy(fresh,x.p,newSize);
+	  delete [] p;
+	  p = fresh;
+	  realSize = newSize;
+	  maxWritten = x.maxWritten;
+	  a = x.a;
+#ifdef VERY_ARRAY_DEBUG
+	  cout << "NEW ARRAY because of operator=: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+	}
+      return *this;
+    }
+  
+  // Overload for non-const sources; same behaviour as the const version.
+  Array<T>& operator=(Array<T>&x)
+    {
+      return operator=(static_cast<const Array<T>&>(x));
+    }
+  
+  // Makes index n accessible, growing the storage if necessary.
+  void allowAccess(int n) 
+    { 
+      while( realSize<=n )
+	_expand(); 
+      maxWritten=max(maxWritten,n);
+      massert( maxWritten<realSize );
+    }
+  // Sets size() to n, growing the storage if necessary (it never shrinks).
+  void resize(int n)
+    {
+      while( realSize<n ) 
+	_expand(); 
+      maxWritten=n-1;
+    }
+  // Sorts the first `until` elements ascending (all elements for -1).
+  void sort(int until=-1)
+    {
+      if( until== -1 ) until=size();
+      std::sort(p,p+until);
+    }
+  // Sorts the first `until` elements descending (all elements for -1).
+  void invsort(int until=-1)
+    {
+      if( until== -1 ) until=size();
+      std::sort(p,p+until,greater<T>());      
+    }
+  // Replaces the contents by n copies of _init.  The new storage is filled
+  // before the old one is released, because _init may refer to an element of
+  // this very array.
+  void init(int n,const T&_init,bool _a=0)
+    {
+#ifdef VERY_ARRAY_DEBUG
+      cout << "FREE ARRAY because of init: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+      T *fresh=new T[n];
+      for(int iii=0;iii<n;iii++)fresh[iii]=_init;
+      delete []p;
+      p=fresh;
+      realSize=n;
+      a=_a;
+      maxWritten=n-1;
+#ifdef VERY_ARRAY_DEBUG
+      cout << "NEW ARRAY because of init: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+    }
+  inline int size() const
+    {massert( maxWritten<realSize );
+    return maxWritten+1;}
+  inline int low() const
+    { return 0; }
+  inline int high() const
+    { return maxWritten; }
+  inline bool autoexpand() const 
+    {return a;}
+  inline void autoexpand(bool autoExp) 
+    {a=autoExp;}
+  int findMax() const;
+  int findMin() const;
+  const void errorAccess(int n) const;
+  inline T*getPointerToData(){return p;}
+  
+  // Checked element access; with autoexpand on, index size() appends.
+  inline T& operator[](int n)
+    { 
+      if( a && n==maxWritten+1 )
+	allowAccess(n);
+      if( n<0 || n>maxWritten )
+	errorAccess(n);
+      return p[n];
+    }
+  inline const T& operator[](int n) const 
+    { 
+      if(n<0 || n>maxWritten )
+	errorAccess(n);
+      return p[n]; 
+    }
+  // n-th element counted from the end (0 == last element).
+  const T&top(int n=0) const
+    {return (*this)[maxWritten-n];}
+  T&top(int n=0)
+    {return (*this)[maxWritten-n];}
+  // Appends x (requires autoexpand) and returns the new last element.
+  T&push(const T&x)
+    {
+      if( a && maxWritten+1>=realSize )
+	{
+	  // The append reallocates; x may refer to an element of this very
+	  // array, so copy it before the old storage is released.
+	  const T saved(x);
+	  (*this)[maxWritten+1]=saved;
+	}
+      else
+	(*this)[maxWritten+1]=x;
+      return top();
+    }
+  // Writes "Array <size> <a>" followed by one element per line.  `a` is a
+  // char, so the flag is written as a single raw character.
+  bool writeTo(ostream&out) const
+    {
+      out << "Array ";
+      out << size() << " ";
+      out << a << endl;
+      for(int iv=0;iv<=maxWritten;iv++)
+	{
+	  writeOb(out,(*this)[iv]);
+	  out << endl;
+	}
+      return 1;
+    }
+  // Reads the format produced by writeTo().  Returns 0 (after a message on
+  // cerr) if the stream is bad, the "Array" tag is missing, or the
+  // size/autoexpand header cannot be read or holds a negative size.
+  bool readFrom(istream&in)
+    {
+      string s;
+      if( !in )
+	{
+	  cerr << "ERROR(Array): file cannot be opened.\n";
+	  return 0;
+	}
+      in >> s;
+      if( !(s=="Array") )
+	{
+	  cerr << "ERROR(Array): Array!='"<<s<<"'\n";
+	  return 0;
+	}
+      int biggest=-1;
+      in >> biggest;
+      in >> a;
+      if( !in || biggest<0 )
+	{
+	  cerr << "ERROR(Array): invalid size/autoexpand header.\n";
+	  return 0;
+	}
+      resize(biggest);
+      for(int iv=0;iv<size();iv++)
+	{
+	  readOb(in,(*this)[iv]);
+	}
+      return 1;
+    }
+};
+
+// Two arrays are equal when they are the same object, or have the same size
+// and compare equal element by element.
+template<class T> bool operator==(const Array<T> &x, const Array<T> &y)
+{
+  if( &x == &y )
+    return true;
+  if( y.size()!=x.size() )
+    return false;
+  for(int pos=0;pos<x.size();++pos)
+    {
+      if( !(x[pos]==y[pos]) )
+	return false;
+    }
+  return true;
+}
+
+// Lexicographic "less than".  When x is the longer array the answer is
+// derived from the swapped comparison; otherwise the first differing element
+// decides, and a proper prefix is smaller than the longer array.
+template<class T> bool operator<(const Array<T> &x, const Array<T> &y)
+{
+  if( &x == &y )
+    return false;
+  if( y.size()<x.size() )
+    return !(y<x);
+  for(int pos=0;pos<x.size();++pos)
+    {
+      massert( pos!=y.size() );
+      if( x[pos]<y[pos] )
+	return true;
+      if( y[pos]<x[pos] )
+	return false;
+    }
+  return x.size()!=y.size();
+}
+
+
+// Reports an out-of-range access to index n on both cerr and cout, trips
+// massert(0) and, unless DEBUG is defined, aborts the program.
+template<class T> const void Array<T>:: errorAccess(int n) const
+{
+  const void *const storage = (void*)p;
+  cerr << "ERROR: Access to array element " << n << " (" << maxWritten
+       << "," << realSize << "," << storage << " " << a << ")\n";
+  cout << "ERROR: Access to array element " << n << " (" << maxWritten
+       << "," << realSize << "," << storage << "  " << a << ")\n";
+  massert(0);
+#ifndef DEBUG
+  abort();
+#endif
+}
+
+// Prints "Array(<size>,<autoexpand>){ " followed by " <index>:<element>;" for
+// every element and a closing "}" plus newline.
+template<class T> ostream& operator<<(ostream&o,const Array<T>&a)
+{
+  o << "Array(" << a.size() << "," << a.autoexpand() << "){ ";
+  int pos=0;
+  while( pos<a.size() )
+    {
+      o << " " << pos << ":" << a[pos] << ";";
+      ++pos;
+    }
+  o << "}\n";
+  return o;
+}
+
+template<class T> istream& operator>>(istream&in, Array<T>&)
+{return in;} // no-op: nothing is read and the array is left untouched; the stream is returned unchanged
+
+// Hash of an array: the element hashes weighted by their 1-based position,
+// plus 47 times the number of elements.
+template<class T> int Hash(const Array<T>&a)
+{
+  int weighted=0;
+  for(int pos=0;pos<a.size();++pos)
+    {
+      const int weight=pos+1;
+      weighted+=Hash(a[pos])*weight;
+    }
+  return weighted+a.size()*47;
+}
+// Assigns the first n elements of bb to aa, front to back.
+template<class T> void Array<T>::copy(T *aa,const T *bb,int n)
+{
+  int pos=0;
+  while( pos<n )
+    {
+      aa[pos]=bb[pos];
+      ++pos;
+    }
+}
+// Same as the overload above, for a non-const source pointer.
+template<class T> void Array<T>::copy(T *aa,T *bb,int n)
+{
+  int pos=0;
+  while( pos<n )
+    {
+      aa[pos]=bb[pos];
+      ++pos;
+    }
+}
+
+// Grows the storage to 2*realSize+1 slots and carries over the old slots.
+// maxWritten is not changed here.
+template<class T> void Array<T>::_expand()
+{
+#ifdef VERY_ARRAY_DEBUG
+  cout << "FREE ARRAY because of _expand: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+  const int previousSize=realSize;
+  T *previous=p;
+  realSize=2*previousSize+1;
+  p=new T[realSize];
+  copy(p,previous,previousSize);
+  delete [] previous;
+#ifdef VERY_ARRAY_DEBUG
+  cout << "NEW ARRAY because of _expand: " << this << " " << realSize<<" "<<(void*)p << endl;
+#endif			
+}
+
+// Index of the first largest element (compared with operator<), or -1 for an
+// empty array.
+template<class T> int Array<T>::findMax() const
+{
+  const int count=size();
+  if( count==0 )
+    return -1;
+  if( count<2 )
+    return 0;
+  const T *const first=p;
+  return static_cast<int>(std::max_element(first,first+count)-first);
+}
+// Index of the first smallest element (compared with operator<), or -1 for
+// an empty array.
+template<class T> int Array<T>::findMin() const
+{
+  const int count=size();
+  if( count==0 )
+    return -1;
+  if( count<2 )
+    return 0;
+  const T *const first=p;
+  return static_cast<int>(std::min_element(first,first+count)-first);
+}
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/FixedArray.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/FixedArray.h
@ -0,0 +1,287 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+#ifndef FIXARRAY_H_DEFINED
+#define FIXARRAY_H_DEFINED
+#include <iostream>
+#include <string>
+#include <functional>
+
+// Writes `f` followed by one blank to `out`.  Always reports success.
+template<class T>
+bool writeOb(ostream&out,const T&f)
+{
+  out << f;
+  out << " ";
+  return true;
+}
+
+// Reads one value into `f`, then consumes exactly one further character and
+// asserts (massert) that it is the blank written by writeOb.
+// Always reports success.
+template<class T>
+bool readOb(istream&in,T&f)
+{
+  in >> f;
+  char separator;
+  in.get(separator);
+  massert(separator==' ');
+  return true;
+}
+
+// Writes the tag `s`, a blank, the value `f` and a trailing blank to `out`.
+// Always reports success.
+template<class T>
+bool writeOb(ostream&out,const string &s,const T&f)
+{
+  out << s << " ";
+  out << f << " ";
+  return true;
+}
+// Reads a tag and checks it against `s`.  On a mismatch an error is printed
+// to cerr and 0 is returned without reading a value.  Otherwise reads the
+// value into `f`, consumes one more character, asserts (massert) that it is
+// a blank, and returns 1.
+template<class T>
+bool readOb(istream&in,const string&s,T&f)
+{
+  string tag;
+  in >> tag;
+  if( s!=tag )
+    {
+      cerr << "ERROR: readOb should be '" << s << "' and is '" << tag << "'" << endl;
+      return false;
+    }
+
+  in >> f;
+  char separator;
+  in.get(separator);
+  massert(separator==' ');
+  return true;
+}
+
+// Heap-allocated array of `realSize` elements with unchecked indexing.
+// `p` and `realSize` are public and are read directly by the free operators
+// that follow the class.
+//
+// Changes relative to the previous version (interface unchanged):
+//  * operator= and init() build the new buffer before releasing the old one,
+//    so a throwing allocation or element assignment no longer leaves `p`
+//    dangling, and init(n,a[k]) no longer reads a freed element;
+//  * readFrom() rejects a size that failed to parse or is negative instead
+//    of passing it on to resize().
+template<class T> class FixedArray
+{
+ private:  
+  // Assigns bb[0..nnn) to aa[0..nnn) element by element.
+  void copy(T *aa,const T *bb,int nnn)
+    {for(int iii=0;iii<nnn;iii++)aa[iii]=bb[iii];}
+  
+ public:
+  T *p;                       	// owned buffer; 0 for a default-constructed array
+  int realSize;                 // logical element count (-1 after destruction)
+  FixedArray() 
+    : p(0),realSize(0){}
+  FixedArray(const FixedArray<T> &x)
+    : p(new T[x.realSize]),realSize(x.realSize) {copy(p,x.p,realSize);}
+  // n default-constructed elements.
+  explicit FixedArray(int n)
+    : p(new T[n]),realSize(n){}
+  // n copies of _init.
+  FixedArray(int n,const T&_init)
+    : p(new T[n]),realSize(n){for(int z=0;z<n;z++)p[z]=_init;}
+  // Copy of f with t appended as the last element.
+  FixedArray(const FixedArray&f,const T&t)
+    : p(new T[f.size()+1]),realSize(f.size()+1){for(int z=0;z<f.size();z++)p[z]=f[z];p[f.size()]=t;}
+  ~FixedArray() 
+    { delete [] p;p=0;realSize=-1;}
+  
+  FixedArray<T>& operator=(const FixedArray<T>&x)
+    {
+      if( this!= &x )
+	{
+	  // Copy first, release afterwards: if anything throws, *this still
+	  // owns its previous, valid buffer.
+	  T*np=new T[x.realSize];
+	  copy(np,x.p,x.realSize);
+	  delete [] p;
+	  p=np;
+	  realSize=x.realSize;
+	}
+      return *this;
+    }
+  // Sets the length to n.  Growing reallocates and keeps the old elements;
+  // n<=size() is delegated to shrink().
+  void resize(int n)
+    {
+      if( n<=realSize )
+	shrink(n);
+      else
+	{
+	  T*np=new T[n];
+	  copy(np,p,realSize);
+	  delete []p;
+	  p=np;
+	  realSize=n;
+	}
+    }
+  // Lowers the logical length to n; the buffer itself is kept as is.
+  void shrink(int n)
+    {
+      assert(n<=realSize);
+      realSize=n;
+    }
+  // Replaces the contents with n copies of _init.
+  void init(int n,const T&_init)
+    {
+      // Fill the new buffer before deleting the old one: _init may refer to
+      // an element of the current buffer.
+      T*np=new T[n];
+      for(int l=0;l<n;l++)np[l]=_init;
+      delete []p;
+      p=np;
+      realSize=n;
+    }
+  // Element n positions below the last one (n=0: last element).  Unchecked.
+  inline const T&top(int n=0) const
+    {return (*this)[realSize-1-n];}
+  inline int size() const 
+    {return realSize;}
+
+  inline T*begin(){ return p; }
+  inline T*end(){ return p+realSize; }
+
+  inline const T*begin()const{ return p; }
+  inline const T*end()const{return p+realSize;}
+
+  inline int low() const 
+    {return 0;}
+  inline int high() const 
+    {return realSize-1;}
+  const void errorAccess(int n) const;
+  
+  // Unchecked element access.
+  inline T& operator[](int n)
+    { 
+      return p[n];
+    }
+  inline const T& operator[](int n) const 
+    { 
+      return p[n]; 
+    }
+  // Writes "FixedArray <size> " followed by every element (via writeOb, plus
+  // one extra blank each) and a line end.  Always returns 1.
+  bool writeTo(ostream&out) const
+    {
+      out << "FixedArray ";
+      out << size() << " ";
+      for(int a=0;a<size();a++)
+	{
+	  writeOb(out,(*this)[a]);
+	  out << " ";
+	}
+      out << endl;
+      return 1;
+    }
+  // Reads the format produced by writeTo().  Returns 0 (after a message on
+  // cerr) when the stream is bad, the "FixedArray" tag is missing, or the
+  // size is unreadable or negative; returns 1 otherwise.
+  bool readFrom(istream&in)
+    {
+      string s;
+      if( !in )
+	{
+	  cerr << "ERROR(FixedArray): file cannot be opened.\n";
+	  return 0;
+	}
+      in >> s;
+      if( !(s=="FixedArray") )
+	{
+	  cerr << "ERROR(FixedArray): FixedArray!='"<<s<<"'\n";
+	  return 0;
+	}
+      int biggest=0;
+      in >> biggest;
+      if( !in||biggest<0 )
+	{
+	  cerr << "ERROR(FixedArray): invalid size.\n";
+	  return 0;
+	}
+      resize(biggest);
+      for(int a=0;a<size();a++)
+	readOb(in,(*this)[a]);
+      return 1;
+    }
+  // Sorts the first `until` elements ascending (-1: the whole array).
+  void sort(int until=-1)
+    {
+      if( until== -1 ) until=size();
+      std::sort(p,p+until);
+    }
+  // Sorts the first `until` elements descending (-1: the whole array).
+  void invsort(int until=-1)
+    {
+      if( until== -1 ) until=size();
+      std::sort(p,p+until,greater<T>());      
+    }
+  // Index of the first element not less than t, or -1 when every element is
+  // less than t.  Requires the array to be sorted ascending.
+  int binary_locate(const T&t)
+    {
+      T*ppos=std::lower_bound(p,p+size(),t);
+      int pos=ppos-p;
+      if( pos>=-1&&pos<size() )
+	return pos;
+      else
+	return -1;
+    }
+  // Index of an element equal to t, or -1 when there is none.  Requires the
+  // array to be sorted ascending.
+  int binary_search(const T&t)
+    {
+      T*ppos=std::lower_bound(p,p+size(),t);
+      int pos=ppos-p;
+      if( pos>=0&&pos<size()&& *ppos==t )
+	return pos;
+      else
+	return -1;
+    }
+  typedef T* iterator;
+  typedef const T* const_iterator;
+};
+
+// Lexicographic ordering over the elements of x and y.
+template<class T> bool operator<(const FixedArray<T> &x, const FixedArray<T> &y)
+{
+  const T *xFirst=x.begin();
+  const T *xLast=x.end();
+  const T *yFirst=y.begin();
+  const T *yLast=y.end();
+  return lexicographical_compare(xFirst,xLast,yFirst,yLast);
+}
+
+
+// Two arrays are equal when they are the same object, or have the same size
+// and pairwise equal elements.
+template<class T>  bool operator==(const FixedArray<T> &x, const FixedArray<T> &y)
+{
+  if( &x == &y )
+    return true;
+
+  const int len = x.size();
+  if( len != y.size() )
+    return false;
+
+  int k=0;
+  while( k<len && x.p[k]==y.p[k] )
+    ++k;
+  return k==len;
+}
+
+// Polynomial hash of a FixedArray: n = 13*n + Hash(element), folded over the
+// elements in index order.
+//
+// Accumulated in unsigned arithmetic, where wrap-around is well defined.
+// The previous `int` accumulator overflowed (undefined behaviour) for arrays
+// of even moderate length.  Results are unchanged while no overflow occurs.
+template<class T> int Hash(const FixedArray<T>&a)
+{
+  unsigned int n=0;
+  const int s=a.size();
+  for(int iii=0;iii<s;iii++)
+    n=13u*n+static_cast<unsigned int>(Hash(a.p[iii]));
+  return static_cast<int>(n);
+}
+
+// Reports an invalid access to element n on cerr, together with the current
+// size and buffer address, and then trips massert(0).
+//
+// The message is written before asserting.  With the assertion first, a
+// build in which massert aborts would never show it.
+// NOTE(review): massert is defined outside this file; confirm it aborts.
+template<class T> const void FixedArray<T>:: errorAccess(int n) const
+{
+  cerr 	<< "ERROR: Access to array element " << n 
+	<< " (" << realSize << "," << (void*)p << ")\n";
+  massert(0);
+}
+	
+// Dumps `a` to `o`: a header "FixedArray(<size>){ ", then " <index>:<value>;"
+// for every element, then "}\n".
+template<class T> ostream& operator<<(ostream&o,const FixedArray<T>&a)
+{
+  o << "FixedArray(" << a.size() << "){ ";
+  int idx=0;
+  while( idx<a.size() )
+    {
+      o << " " << idx << ":" << a[idx] << ";";
+      ++idx;
+    }
+  o << "}\n";
+  return o;
+}
+
+// Extraction stub: consumes nothing from `in` and leaves the array untouched.
+template<class T> istream& operator>>(istream&in, FixedArray<T>&)
+{
+  return in;
+}
+
+// Element-wise sum of two arrays; massert checks that the sizes match.
+template<class T> FixedArray<T> operator+(const FixedArray<T>&a,const FixedArray<T>&b)
+{
+  massert(a.size()==b.size());
+  FixedArray<T> sum(a.size());
+  int k=0;
+  while( k<a.size() )
+    {
+      sum[k]=a[k]+b[k];
+      ++k;
+    }
+  return sum;
+}
+// Element-wise logical OR (||) of two arrays; iassert checks that the sizes
+// match.
+template<class T> FixedArray<T> operator|(const FixedArray<T>&aaa,const FixedArray<T>&bbb)
+{
+  iassert(aaa.size()==bbb.size());
+
+  FixedArray<T> result(aaa.size());
+  int k=0;
+  while( k<aaa.size() )
+    {
+      result.p[k]=aaa.p[k]||bbb.p[k];
+      ++k;
+    }
+  return result;
+}
+
+#endif
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/FlexArray.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/FlexArray.h
@ -0,0 +1,48 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+#ifndef CLASS_FlexArray_defined
+#define CLASS_FlexArray_defined
+#include "FixedArray.h"
+
+// Array addressed with indices from `start` to `end` (both inclusive) rather
+// than from 0: index i is stored in slot i-start of a FixedArray.
+// Access is unchecked.
+template<class T>
+class FlexArray
+{
+private:
+  FixedArray<T> p;   // storage with _end-_start+1 slots
+  int start,end;     // index bounds passed to the constructor
+public:
+  // The default bounds (0,-1) yield an array with no slots.
+  FlexArray(int _start=0,int _end=-1)
+    : p(_end-_start+1),start(_start),end(_end) {}
+  T&operator[](int i)
+    {return p[i-start];}
+  // Fixed: this overload read `returnp[i-start];` (missing blank), which
+  // does not name anything and does not compile.
+  const T&operator[](int i)const
+    {return p[i-start];}
+  int low()const{return start;}
+  int high()const{return end;}
+};
+
+
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/GDAOptimization.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/GDAOptimization.cpp
@ -0,0 +1,159 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+#include "GDAOptimization.h"
+#include "ProblemTest.h"
+#include <cmath>
+
+// Self-referential macros: each name expands to itself, so they have no
+// effect on the code below.
+#define GDAOptimization GDAOptimization
+#define IterOptimization IterOptimization
+
+     
+     
+// Start temperature used by the two-argument constructor.  The value 1e100
+// is a sentinel: zInitialize() replaces it with the problem's current value.
+double GDAOptimization::defaultTemperatur=1e100;
+
+
+// Cooling rate used by the two-argument constructor; optimizeValue()
+// overwrites it while sweeping candidate values.
+double GDAOptimization::defaultAlpha=0.001;
+
+
+     
+// Builds an optimizer over `p` with the class-wide default temperature and
+// alpha; `m` is passed on to IterOptimization.
+//
+// gdaEndFlag is now initialised.  It used to be left indeterminate although
+// end() and the copy constructor read it.
+GDAOptimization::GDAOptimization(Problem &p,int m) 
+: IterOptimization(p,m) ,temperatur(defaultTemperatur),alpha(defaultAlpha),
+  gdaEndFlag(0)
+{
+}
+
+     
+// Builds an optimizer over `p` with start temperature `t` and cooling rate
+// `a`; `m` is passed on to IterOptimization.
+//
+// gdaEndFlag is now initialised.  It used to be left indeterminate although
+// end() and the copy constructor read it.
+GDAOptimization::GDAOptimization(Problem &p,double t,double a,int m) 
+: IterOptimization(p,m) ,temperatur(t) ,alpha(a),
+  gdaEndFlag(0)
+{
+}
+
+     
+// Copies the base-class state plus temperature, alpha and the GDA end flag.
+GDAOptimization::GDAOptimization(GDAOptimization &o)
+: IterOptimization(o),
+  temperatur(o.temperatur),
+  alpha(o.alpha),
+  gdaEndFlag(o.gdaEndFlag)
+{
+}
+
+     
+// Runs the base-class initialisation and, if the temperature still holds the
+// 1e100 sentinel, starts it at the problem's current value.
+void GDAOptimization::zInitialize()
+{
+  IterOptimization::zInitialize();
+
+  const bool noStartTemperature = (temperatur==1e100);
+  if( noStartTemperature )
+    temperatur=problem.value();
+
+  assert(alpha>=0);
+}
+
+// Accepts a change (returns 1) when the value after applying `delta` stays
+// strictly below the current temperature; returns 0 otherwise.
+short GDAOptimization::accept(double delta)
+{
+  const double valueAfter = curValue + delta;
+  return ( valueAfter < temperatur ) ? 1 : 0;
+}
+
+// Cooling step ("abkuehlen" = cool down): moves the temperature towards
+// curValue by the fraction alpha.  gdaEndFlag becomes 1 when the step was
+// smaller than 1e-30 and 0 otherwise.
+void  GDAOptimization::abkuehlen()
+{
+  const double cooled = temperatur - alpha*(temperatur - curValue);
+  const bool stalled = fabs(temperatur - cooled)<1e-30;
+  gdaEndFlag = stalled ? 1 : 0;
+  temperatur = cooled;
+}
+
+// The run ends only when the base-class end flag is set and the cooling has
+// stalled as well (gdaEndFlag).
+short GDAOptimization::end()
+{
+  if( !( endFlag>0 ) )
+    return 0;
+  return gdaEndFlag ? 1 : 0;
+}
+
+// Appends the gap between temperature and current value to the base-class
+// trace record written to *GraphOutput.
+void GDAOptimization::makeGraphOutput()
+{
+  IterOptimization::makeGraphOutput();
+  const double gap = temperatur-curValue;
+  (*GraphOutput) << gap;
+}
+	
+
+
+     
+// Sweeps the cooling rate alpha and returns the value that gave the lowest
+// result reported by solveProblem.
+//
+//   p                    problem to solve
+//   proParameter         forwarded to solveProblem (third argument)
+//   numParameter         the sweep evaluates numParameter+1 alpha values
+//   typ                  must be 1; any other value prints an error and
+//                        exits the process
+//   optimierungsschritte forwarded to solveProblem (fourth argument)
+//   print                non-zero: print one statistics line per alpha
+//
+// Side effects: overwrites the static defaultTemperatur (set to 1e100) and
+// defaultAlpha (left at 0.03 on return).
+// NOTE(review): 0.03 differs from defaultAlpha's static initial value of
+// 0.001 — confirm which is intended.
+double GDAOptimization::optimizeValue(Problem &p,int proParameter,int numParameter,int typ,
+			 int optimierungsschritte,int print)
+{
+  if(typ!=1)
+    {
+      cerr << "Error: wrong parameter-type in GDAOptimization::optimizeValue ("
+	<< typ << ")\n";
+      exit(1);
+    }
+  else
+    {
+      double bestPar=-1,best=1e100;
+      double now;
+      if( print )
+	cout << "#GDA-optimizeValues: " << numParameter<<endl;
+
+      
+      // 1e100 is the sentinel that makes zInitialize() pick the start
+      // temperature from the problem's value.
+      defaultTemperatur=1e100; 
+
+      for(int i=0;i<=numParameter;i++)
+	{
+	  StatVar end,laufzeit,init;
+	  // Geometric grid: 0.002 * 200^(i/numParameter), i.e. from 0.002
+	  // (i=0) up to 0.4 (i=numParameter).
+	  defaultAlpha = pow(pow(200,1.0/numParameter),i)*0.002;
+	  solveProblem(0,p,proParameter,optimierungsschritte,GDA_OPT,now,end,
+		       laufzeit,init);
+	  if( best>now )
+	    {
+	      best=now;
+	      bestPar=defaultAlpha;
+	    }
+	  if( print )
+	    {
+	      // NOTE(review): the column header below says "0.8-Quantil" but
+	      // quantil(0.79) is printed — confirm.
+	      cout << defaultAlpha <<" ";
+	      cout << end.getMean() << " " << end.quantil(0.2) << " " 
+		<< end.quantil(0.79) << "  " << laufzeit.getMean() << " " 
+		<< end.quantil(0.0) << " " << end.getSigma() << " " 
+		<< end.getSigmaSmaller()<< " "<< end.getSigmaBigger()<< endl;
+	    }
+	}
+      if( print )
+	cout << "#Parameter Mittelwert 0.2-Quantil 0.8-Quantil Laufzeit"
+	        " Bester Sigma SigmaSmaller SigmaBigger\n";
+      defaultAlpha=0.03;
+      return bestPar;
+    }
+	// Not reached: both branches above leave the function.
+	return 1e100;
+}
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/GDAOptimization.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/GDAOptimization.h
@ -0,0 +1,80 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+
+
+#ifndef GDAOPTIMIZATION
+#define GDAOPTIMIZATION
+#include "IterOptimization.h"
+
+// Iterative optimizer that accepts a change while the resulting value stays
+// below a threshold ("temperatur") which is lowered towards the current
+// value on every step.
+class GDAOptimization : public IterOptimization
+{
+  
+   private:
+     // Acceptance threshold compared against curValue+delta in accept().
+     double temperatur;  
+     // Fraction by which abkuehlen() moves temperatur towards curValue.
+     double alpha;       
+     // Set by abkuehlen(): 1 when the last cooling step was below 1e-30.
+     short gdaEndFlag; 
+                       
+
+   protected:
+      // Base initialisation; replaces a 1e100 temperature by problem.value().
+      virtual void zInitialize();
+     
+
+      // 1 when curValue+delta < temperatur, else 0.
+      virtual short accept(double delta); 
+     
+     
+      // Cooling step ("abkuehlen" = cool down).
+      virtual void  abkuehlen();
+     
+
+      // Non-zero when both endFlag and gdaEndFlag are set.
+      virtual short end();
+     
+
+      // Base trace record followed by temperatur-curValue.
+      virtual void makeGraphOutput();
+     
+
+   public:
+      GDAOptimization(Problem &p,double temperatur,double alpha,
+     int maxIter=-1);
+     
+
+      // Uses defaultTemperatur and defaultAlpha.
+      GDAOptimization(Problem &p,int maxIter=-1);
+     
+
+      GDAOptimization(GDAOptimization &o);
+     
+
+      // Sweeps alpha and returns the best value found; see the definition.
+      static double optimizeValue(Problem &p,int proParameter,
+     int numParameter,int typ,int schritte= -1,int verbose=1);
+     
+
+     
+     // Defaults picked up by the (Problem&,int) constructor.
+     static double defaultTemperatur; 
+     static double defaultAlpha;      
+
+};
+#endif
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/HCOptimization.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/HCOptimization.cpp
@ -0,0 +1,57 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+#include "HCOptimization.h"
+
+// Builds a hill-climbing optimizer over `p`.  A non-positive step limit is
+// replaced by the problem's expected number of iterations.
+HCOptimization::HCOptimization(Problem &p,int m) 
+: IterOptimization(p,m) 
+{
+  const bool limitGiven = maxStep>0;
+  if( !limitGiven )
+    maxStep=(int)(problem.expectedNumberOfIterations());
+}
+// Copy construction: all state lives in the IterOptimization base.
+HCOptimization::HCOptimization(HCOptimization &o)
+  : IterOptimization(o)
+{}
+
+
+// Hill climbing accepts only strict improvements: 1 for delta<0, else 0.
+short HCOptimization::accept(double delta)
+{
+  return ( delta < 0 ) ? 1 : 0;
+}
+// The run ends as soon as the base-class end flag is set.
+short HCOptimization::end() 
+{ 
+  const bool finished = endFlag>0;
+  return finished;
+}
+// Cooling step ("abkuehlen" = cool down): intentionally empty, this
+// optimizer keeps no state to update here.
+void HCOptimization::abkuehlen()
+{}
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/HCOptimization.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/HCOptimization.h
@ -0,0 +1,54 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+
+
+#ifndef HCOPTIMIZATION
+#define HCOPTIMIZATION
+#include "IterOptimization.h"
+
+// Hill-climbing variant of IterOptimization: only changes with a negative
+// delta are accepted.
+class HCOptimization : public IterOptimization
+{
+  
+   protected:
+      // 1 when delta<0, else 0.
+      virtual short accept(double delta); 
+     
+
+      // Cooling step ("abkuehlen" = cool down); empty for this optimizer.
+      virtual void  abkuehlen();
+     
+
+      // Non-zero once endFlag is set.
+      virtual short end();
+     
+
+   public:
+      // A non-positive maxIter is replaced by
+      // problem.expectedNumberOfIterations().
+      HCOptimization(Problem &p,int maxIter=-1);
+     
+
+      HCOptimization(HCOptimization &o);
+     
+
+};
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/IterOptimization.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/IterOptimization.cpp
@ -0,0 +1,199 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+#include "IterOptimization.h"
+#include "ProblemTest.h"
+
+// Optional trace sink: minimize() writes progress records to it only while
+// the pointer is non-null.
+ostream *GraphOutput; 
+
+
+  
+// Binds the optimizer to `p` with step limit `m`.  The run state proper is
+// set up later by zInitialize() (initialisiert stays 0 until then).
+//
+// Every member now gets a defined start value.  Previously curStep,
+// curValue, bestStep, bestValue, endFlag and endFlag2 were indeterminate
+// until zInitialize(), yet the copy constructor reads them from objects that
+// may not have been initialised.
+IterOptimization::IterOptimization(Problem& p,int m) 
+  : maxNonBetterIterations(0),problem(p),curStep(0),curValue(0),bestStep(0),
+    bestValue(0),maxStep(m),initialisiert(0),endFlag(0),endFlag2(0)
+{
+}
+
+
+
+// Copies the complete run state of `o`; the copy refers to the same Problem.
+//
+// curStep is now copied as well.  It used to be skipped, so a copy of a
+// running optimizer continued with an indeterminate step counter while
+// bestStep was carried over.
+IterOptimization::IterOptimization(IterOptimization& o) : Optimization(),problem(o.problem)
+{
+  maxNonBetterIterations=o.maxNonBetterIterations;
+  curStep = o.curStep;
+  curValue = o.curValue;
+  bestStep = o.bestStep;
+  bestValue = o.bestValue;
+  maxStep = o.maxStep;
+  initialisiert = o.initialisiert;
+  endFlag = o.endFlag;
+  endFlag2 = o.endFlag2;
+}
+
+
+     
+// Runs the optimisation loop and returns the current value afterwards.
+//
+//   steps > 0   perform at most `steps` iterations in this call
+//   steps == 0  only initialise (if needed) and return the current value
+//   steps < 0   no per-call limit; the loop stops on end() or
+//               problem.endCriterion() only
+//
+// Each iteration proposes a change, evaluates its delta, calls abkuehlen()
+// (cool down), and applies the change if accept(delta) says so.
+double IterOptimization::minimize(int steps)
+{
+  // Lazy initialisation on the first call ("initialisiert" = initialised)
+  if( !initialisiert )
+    zInitialize();
+  
+  if( steps==0 )
+    return curValue;
+  
+  int t=0;
+  // Trace interval for GraphOutput, in steps
+  int every=(steps<0)?10000:(steps/1000+1);
+  
+  do
+    {
+      curStep++; 
+      t++;
+      if(verboseMode&&(curStep%1000==0))
+	{
+	  // NOTE(review): the percentage is relative to maxStep, not to the
+	  // `steps` argument — confirm this is intended.
+	  if(steps>0)
+	    cout << "Processed: " << 100.0*(curStep/(double)max(maxStep,1)) << " percent. (IterOptimization run) " 
+		 << curValue << " max:" << maxStep << " " << steps << "            \r";
+	  else
+	    cout << "In step:" << curStep << " currentValue: " << curValue 
+		 << " bestValue: " << bestValue-curValue << " " << curStep-bestStep << ".           \r";
+	  cout.flush();
+	}
+      
+      
+      // The proposed change is owned here and deleted at the end of the
+      // iteration.
+      ProblemChange *change= &(problem.change());
+      
+      
+      double delta=problem.valueChange(*change);
+      
+      
+      // Cooling happens before the acceptance test.
+      abkuehlen();
+      
+      
+      if( accept(delta) )
+	{
+	  
+	  problem.doChange(*change);
+	  
+	  
+	  curValue+=delta;
+	  
+	  
+	  // A new best must beat the old one by more than 1e-10; it also
+	  // clears both end flags.
+	  if( curValue<bestValue-1e-10 )
+	    {
+	      bestValue=curValue;
+	      bestStep=curStep;
+	      endFlag2=endFlag=0;
+	    }
+	  
+	  if( verboseMode>1 )
+	    cout<<"in step: "<<curStep<<" accepted with : "<<delta<<endl;
+	}
+      
+      // endFlag / endFlag2: no new best for more than one / two times
+      // maxNonBetterIterations steps (only if that limit is positive).
+      if(curStep - bestStep>maxNonBetterIterations && maxNonBetterIterations>0)
+	endFlag=1;
+      if(curStep - bestStep>2*maxNonBetterIterations && maxNonBetterIterations>0)
+	endFlag2=1;
+      
+      
+      
+      if( GraphOutput&&((curStep%every)==0) )
+	{
+	  makeGraphOutput();
+	  *GraphOutput<<" "<<delta<<endl;
+	}
+      
+      delete change;
+    } while( t!=steps && (!end()) && (!problem.endCriterion()) );
+  
+  // Final trace record for the state the loop ended in
+  if( GraphOutput)
+    {
+      makeGraphOutput();
+      *GraphOutput<<endl;
+    }
+  return curValue;
+}
+
+
+// Resets the run state: current and best value come from the problem, the
+// step counters and end flags start at zero, and the patience limit is
+// fetched from the problem.
+void IterOptimization::zInitialize() 
+{
+  initialisiert=1;
+
+  curValue=problem.value();
+  bestValue=curValue;
+
+  maxNonBetterIterations=problem.maxNonBetterIterations();
+
+  curStep=0;
+  bestStep=curStep;
+
+  endFlag=0;
+  endFlag2=endFlag;
+}
+
+
+// Writes "<curStep> <curValue> " to *GraphOutput (no line end).
+void IterOptimization::makeGraphOutput()
+{
+  ostream &trace = *GraphOutput;
+  trace << curStep << " ";
+  trace << curValue << " ";
+}
+
+
+// Recursive interval search for the value of `parameter` in [min,max] that
+// gives the lowest mean result from solveProblem.
+//
+//   p          problem to solve
+//   parameter  reference that is assigned each candidate value before
+//              solveProblem runs (presumably it aliases the setting the
+//              chosen method reads — TODO confirm against callers)
+//   min,max    current search interval
+//   nRun       forwarded to solveProblem (third argument)
+//   nPar       remaining evaluation budget; each level uses two
+//   verfahren  method selector forwarded to solveProblem ("Verfahren" = method)
+//   bv         out: mean value belonging to the returned parameter
+//
+// With nPar<=0 the midpoint of the interval is returned without being
+// evaluated and `bv` is left untouched.
+double IterOptimizationOptimizeParameter(Problem &p,
+					 double &parameter,double min,double max,
+					 int nRun,int nPar,int verfahren,
+					 double &bv)
+{
+  if( nPar<=0 )
+    return (max+min)/2;
+  
+  StatVar end1,time1,init1;
+  StatVar end2,time2,init2;
+  double mean1,mean2;
+  double par1,par2;
+
+  // Probe at one third of the interval
+  parameter = par1 = min + (max-min)/3;
+  solveProblem(0,p,nRun,-1,verfahren,mean1,end1,time1,init1);
+  cout << parameter << " " << mean1 << " " << end1.quantil(0.0) << " " << end1.quantil(1.0) << endl;
+
+  // Probe at two thirds of the interval
+  parameter = par2 = min + 2*(max-min)/3;
+  solveProblem(0,p,nRun,-1,verfahren,mean2,end2,time2,init2);
+  cout << parameter << " " << mean2 << " " << end2.quantil(0.0) << " " << end2.quantil(1.0) << endl;
+  
+  // Recurse into the two thirds of the interval around the better probe.
+  // bestVal is pre-set to that probe's mean because the recursion's base
+  // case does not write to it.
+  double bestPar,bestVal;
+  if(mean1<mean2)
+    {
+      bestVal = mean1;
+      bestPar=IterOptimizationOptimizeParameter(p,parameter,min,min+2*(max-min)/3,nRun,nPar-2,verfahren,bestVal);
+    }
+  else
+    {
+      bestVal = mean2;
+      bestPar=IterOptimizationOptimizeParameter(p,parameter,min+(max-min)/3,max,nRun,nPar-2,verfahren,bestVal);
+    }
+  // Return whichever of probe 1, probe 2 and the recursive result is best.
+  if( mean1<bestVal&&mean1<=mean2 )
+    {
+      bv = mean1;
+      return par1;
+    }
+  else if(mean2<bestVal && mean2<=mean1)
+    {
+      bv = mean2;
+      return par2;
+    }
+  else
+    {
+      bv = bestVal;
+      return bestPar;
+    }
+}
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/IterOptimization.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/IterOptimization.h
@ -0,0 +1,123 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+
+
+
+#ifndef ITEROPTIMIZATION
+#define ITEROPTIMIZATION
+
+#include "Optimization.h"
+
+
+
+
+
+#define ANZ_VERSCHLECHTERUNGEN 500 
+
+extern ostream *GraphOutput; 
+                             
+
+// Base class for step-wise optimizers.  minimize() drives the loop;
+// subclasses supply the acceptance rule (accept), the per-step update
+// (abkuehlen, "cool down") and the termination test (end).
+class IterOptimization : public Optimization
+	{
+  
+
+   private:   
+     // Patience: steps without a new best value before endFlag is raised
+     // (twice that for endFlag2).  Fetched from the problem in zInitialize().
+     int maxNonBetterIterations; 
+     
+
+   protected:
+     Problem &problem;  
+     // Number of iterations performed so far
+     int curStep;	
+     // Objective value of the current state
+     double curValue;	
+     // Step at which bestValue was reached
+     int bestStep;      
+     // Lowest value seen so far
+     double bestValue;	
+     // Step limit passed to the constructor
+     int maxStep;       
+     // Non-zero once zInitialize() has run ("initialisiert" = initialised)
+     int initialisiert; 
+     // Raised by minimize() after maxNonBetterIterations steps without a new best
+     short endFlag;     
+     // Raised after twice that many steps
+     short endFlag2;     
+       
+       
+
+
+      // Writes "<curStep> <curValue> " to *GraphOutput.
+      virtual void makeGraphOutput();
+     
+
+      // Termination test evaluated after every iteration.
+      virtual short end()=0;
+     
+
+      // Per-iteration update, called before accept().
+      virtual void  abkuehlen()=0;
+     
+
+      // Non-zero when a change with the given delta should be applied.
+      virtual short accept(double delta)=0;
+     
+
+      // Resets the run state from the problem.
+      virtual void zInitialize();
+     
+
+   public:
+      IterOptimization(Problem &p,int maxIter=-1);
+     
+
+      IterOptimization(IterOptimization &o);
+     
+
+      // Runs up to `steps` iterations (negative: no per-call limit) and
+      // returns the current value.
+      virtual double minimize(int steps=-1);
+     
+
+      inline int getCurStep();
+     
+
+      inline double getCurrentValue(); 
+     
+
+      inline const Problem& getProblem(); 
+     
+
+};
+
+double IterOptimizationOptimizeParameter(Problem &p,
+			     double &parameter,double min,double max,
+			     int nRun,int nPar,int verfahren,double &bv);
+
+// Number of iterations performed so far.
+inline int IterOptimization::getCurStep()
+{
+  return curStep;
+}
+// Objective value of the current state.
+inline double IterOptimization::getCurrentValue()
+{
+  return curValue;
+}
+// Read-only access to the problem being optimised.
+inline const Problem& IterOptimization::getProblem()
+{
+  return problem;
+}
+
+#endif
+
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblem.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblem.cpp
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblem.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblem.h
@ -0,0 +1,439 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+
+
+#ifndef KATEG_OPT_H
+#define KATEG_OPT_H
+#include <string>
+
+#include <stdlib.h>
+#include "Problem.h"
+
+// Factor used inside the logarithm of kat_etaFkt(); defined in
+// KategProblemKBC.cpp.
+extern double rhoLo; 
+
+// Category and word identifiers are plain integers.
+typedef int Kategory;        
+typedef int Word;
+
+
+
+// Frequency counts are integers unless FREQTYPE_DOUBLE is defined.
+#ifdef FREQTYPE_DOUBLE
+typedef double FreqType;
+#else
+typedef int FreqType;
+#endif
+
+
+#include "KategProblemWBC.h" 
+
+
+#include "KategProblemKBC.h" 
+
+
+// Initialisation modes.
+// NOTE(review): the meaning of the individual modes is not visible in this
+// header; see KategProblem::_initialize.
+enum { 
+  INIT_RAN=1,
+  INIT_AIO=2,
+  INIT_LWRW=3,
+  INIT_FREQ=4,
+  INIT_OTHER=5
+     };
+
+
+// Word-selection bits stored in `nachbarschaft`; CHOOSE_WORD is the mask
+// that KategProblem::wortwahl() extracts.  Note that W_RAN (8|16) contains
+// the W_DET_DECR bit (16).
+enum { 
+  W_RAN=(8|16),
+  W_DET_DECR=(16),
+  W_DET_INCR =(32)
+};
+#define CHOOSE_WORD (8|16|32)
+
+
+// Category-selection bits stored in `nachbarschaft`; CHOOSE_KAT is the mask
+// that KategProblem::katwahl() extracts.  K_BEST is both bits set.
+enum {
+  K_DET=(64),
+  K_RAN=(128),
+  K_BEST=(64|128)
+};
+#define CHOOSE_KAT (64|128)
+
+
+// Optimisation criteria.
+// NOTE(review): presumably these pair with the nmo / nmo_lo / nmo_my
+// members of KategProblem — confirm.
+enum {
+  CRITERION_ML=0,
+  CRITERION_LO=1,
+  CRITERION_MY=2
+};
+
+
+
+// Frequency vector with time stamps: an entry of `freq` only counts while
+// its `timeOfFreq` stamp equals `curTime`; otherwise it reads as 0.
+class NWG
+{
+ private:
+  Array<FreqType> freq;     // stored frequencies (valid only where stamped)
+  Array<int> timeOfFreq;    // per-entry stamp, compared against curTime
+  int curTime;              // current stamp
+
+ public:
+  NWG(int n);
+  void init();
+
+  int anzNot0;              // number of indices recorded in not0
+  Array<int> not0;          // indices first written under the current stamp
+  int word;
+
+  // Adds n to entry C, restarting the entry if its stamp is stale.
+  inline void addFreq(int C,FreqType n);
+
+  void sort();
+
+  // Frequency of entry i, or 0 when the entry's stamp is stale.
+  FreqType getFreq(int i)
+    {
+      if( timeOfFreq[i]!=curTime )
+	return 0;
+      return freq[i];
+    }
+};
+
+// Adds n to entry g.  An entry whose stamp is stale is restarted at n,
+// stamped with the current time and appended to the not0 index list.
+inline void NWG::addFreq(int g,FreqType n)
+{
+  if( timeOfFreq[g]!=curTime )
+    {
+      timeOfFreq[g]=curTime;
+      freq[g]=n;
+      not0[anzNot0++]=g;
+      return;
+    }
+  freq[g]+=n;
+}
+
+
+
+// A proposed move of one word between two categories.  Allocation goes
+// through the class-specific operator new/delete declared here (defined
+// elsewhere).
+struct KategProblemChange : public ProblemChange
+{
+  void *operator new(size_t size);
+  void operator delete(void *ptr,size_t size);
+
+  // Word to move
+  int word;     
+  // Destination category ("Kat" = category)
+  int toKat;    
+  // Category the word is moved out of
+  int fromKat;  
+};
+
+// Word-classification problem: assigns every word to a category
+// ("Kategorie") and exposes the Problem interface used by the optimizers.
+// Most members are defined outside this header; comments below state only
+// what this file shows.
+class KategProblem : public Problem
+{
+ private:
+  double kat_h_full(int n);
+  double kat_h_full(double n);
+  double kat_h_part(int n);
+  double kat_h_part(double n);
+  double sigmaVerfaelschung;
+  short katWasEmpty;
+                    
+		    
+
+  // Reset to -1 by setKatOfWord().
+  int nwgWord;
+              
+  // Frequency vectors and self-frequency read by nstrich().
+  NWG nwg; 
+  NWG ngw; 
+  FreqType nww; 
+
+  // Source ("Ursprung") and target ("Ziel") category of the move that
+  // nstrich() evaluates.
+  int ursprung,ziel;    
+ 
+  // Category of each word, indexed by word id.
+  Array<int> _katOfWord; 
+
+  int _maxComp,_maxCompVal;
+
+   double nmo_my(int i,int j);                            
+   double nmo(int i,int j);                            
+      
+
+  double nmo_lo(int i,int j,int &e0,int &e1); 
+  
+
+   void putWord(int word,int to);
+  
+
+   void fastPutWord(int word,int to);
+  
+
+   // Assigns category k to word w and resets nwgWord to -1.  Prints a
+   // diagnostic on cout when the word has a fixed category that differs
+   // from k and neither value is -1; the assignment still takes place.
+   void setKatOfWord(int w,int k)
+{
+  if( !(wordFreq.fixedWord[w]==k||wordFreq.fixedWord[w]==-1||k==-1) )
+    {
+      cout << "mkcls::setKatOfWord::ERROR: " << w << " " << k << " " << wordFreq.fixedWord[w] << " " << (*words)[w] << endl;
+    }
+  _katOfWord[w]=k;
+  nwgWord=-1;
+};
+  
+
+   void fillNWG(int w);
+  
+
+   // Change in the (i,j) count caused by the move from `ursprung` to `ziel`.
+   inline FreqType nstrich(int i,int j);
+  
+
+   void vnstrich(int i,int j);
+  
+
+
+ protected:
+   virtual int _change(ProblemChange **p);
+  
+
+   virtual void _doChange(ProblemChange &c);
+  
+
+   virtual void _undoChange(ProblemChange &c);
+  
+
+   virtual double _value();
+  
+
+   double _valueChange(KategProblemChange &k);
+  
+
+   virtual void incrementDirection();
+  
+
+   virtual int maxDimensionVal(void) ;
+  
+
+   virtual int maxDimension(void) ;
+  
+  
+public:
+  // Word strings, indexed by word id (dereferenced in setKatOfWord).
+  leda_array<string> *words;
+typedef leda_set<int> intSet;
+
+leda_array<intSet> *kats;
+	
+  KategProblemWBC wordFreq;   
+  KategProblemKBC katFreq;    
+
+  Array<int> initLike; 
+  
+   KategProblem(int aw,int mak,int _initialisierung,int _auswertung,
+                           int _nachbarschaft,int minw=0);
+  
+
+  virtual ~KategProblem();
+  
+
+   virtual void _initialize(int initTyp);
+   virtual void _initialize(int initTyp,int specialFixedWord);
+  
+
+   virtual double valueChange(ProblemChange&c);
+  
+
+   virtual Problem *makeEqualProblem();
+  
+
+   virtual double nicevalue(double value=1e100);
+  
+
+   void makeKats();
+  
+
+   virtual void dumpOn(ostream &strm);
+  
+
+   virtual void dumpInfos(ostream &strm);
+  
+
+  
+  
+  
+   // Setter: stores k in the CHOOSE_KAT bits of `nachbarschaft`.
+   inline void katwahl(int k);
+  
+
+   // Setter: stores w in the CHOOSE_WORD bits of `nachbarschaft`.
+   inline void wortwahl(int w);
+  
+
+  
+  
+  
+   // Category currently assigned to word w.
+   inline int katOfWord(int w);
+  
+
+   // Getter: the CHOOSE_WORD bits of `nachbarschaft`.
+   inline short wortwahl();
+  
+
+   // Getter: the CHOOSE_KAT bits of `nachbarschaft`.
+   inline short katwahl() ;
+  
+
+   virtual int maxNonBetterIterations();
+  
+
+   virtual int expectedNumberOfIterations();
+  
+
+   const char *getString(int i);
+   string getTheString(int i);
+  
+
+ void makeTitle(char x[512]);
+
+
+ void fixInitLike();
+
+};
+
+// Category currently assigned to word w.
+inline int KategProblem::katOfWord(int w)
+{
+  return _katOfWord[w];
+}
+// Word-selection bits (CHOOSE_WORD) of the neighbourhood setting.
+inline short KategProblem::wortwahl()
+{
+  return nachbarschaft&CHOOSE_WORD;
+}
+// Category-selection bits (CHOOSE_KAT) of the neighbourhood setting.
+inline short KategProblem::katwahl()
+{
+  return nachbarschaft&CHOOSE_KAT;
+}
+
+// Replaces the category-selection bits of the neighbourhood setting by k and
+// adjusts _maxCompVal: 1 for K_BEST, otherwise the number of categories
+// minus two.
+inline void KategProblem::katwahl(int k) 
+{
+  const int otherBits = nachbarschaft&(~CHOOSE_KAT);
+  nachbarschaft = otherBits | k;
+  _maxCompVal = (k==K_BEST) ? 1 : katFreq.nKats-2;
+}
+
+// Replaces the word-selection bits of the neighbourhood setting by w.
+inline void KategProblem::wortwahl(int w) 
+{
+  const int otherBits = nachbarschaft&(~CHOOSE_WORD);
+  nachbarschaft = otherBits | w;
+}
+
+
+
+// Change of the count for the category pair (i,j) when the current word
+// moves from category `ursprung` to category `ziel`.  Row contributions come
+// from nwg, column contributions from ngw, and nww corrects the cells where
+// both indices are the source or target category.
+inline FreqType KategProblem::nstrich(int i,int j)
+{
+  const bool iFrom = (i==ursprung);
+  const bool iTo   = (i==ziel);
+  const bool jFrom = (j==ursprung);
+  const bool jTo   = (j==ziel);
+
+  FreqType n=0;
+
+  if( iFrom ) n-=nwg.getFreq(j);
+  if( iTo )   n+=nwg.getFreq(j);
+
+  if( jFrom ) n-=ngw.getFreq(i);
+  if( jTo )   n+=ngw.getFreq(i);
+
+  if( iFrom && jFrom ) n+=nww;
+  if( iTo && jTo )     n+=nww;
+
+  if( iFrom && jTo )   n-=nww;
+  if( iTo && jFrom )   n-=nww;
+
+  return n;
+}
+
+
+
+
+
+#define MAX_H_TABLE 4000 
+extern double h_table[],l_table[],hmy_table[],hmy_sigma;
+
+ 
+// Natural logarithm clamped at the bottom: 0 for x<=1e-9, log(x) otherwise.
+inline double kat_mlog(double x)
+{
+  return ( x<=1e-9 ) ? 0 : log(x);
+}
+
+ 
+// Integer variant: 0 for s<=0, a lookup in l_table for s below MAX_H_TABLE
+// (massert verifies the table entry), log(s) otherwise.
+inline double kat_mlog(int s)
+{
+  if( s<=0 )
+    return 0;
+  if( !( s<MAX_H_TABLE ) )
+    return log((double)(s));
+
+  massert( s==0 || l_table[s]==log(s) );
+  return l_table[s];
+}
+
+
+ 
+// n * kat_mlog(n-1) for an integer count.
+inline double kat_hlo(int n)
+{
+  const double logPrev = kat_mlog(n-1);
+  return n*logPrev;
+}
+ 
+// n * kat_mlog(n-1) for a real-valued count.
+inline double kat_hlo(double n)
+{
+  const double logPrev = kat_mlog(n-1);
+  return n*logPrev;
+}
+
+ 
+// n*log(n) for an integer count: 0 for n<=0, a lookup in h_table for n below
+// MAX_H_TABLE (massert verifies the entry to 1e-8), computed otherwise.
+// massert also rejects n below -1.
+inline double kat_h(int n)
+{
+  massert(n>=-1);
+  if( n<=0 )
+    return 0;
+  if( !( n<MAX_H_TABLE ) )
+    return n*log((double)(n));
+
+  massert(n==0||fabs(h_table[n]-n*log((double)n))<1e-8);
+  return h_table[n];
+}
+// n*log(n) for a real-valued count; 0 for n<=1e-9.
+inline double kat_h(double n)
+{
+  return ( n<=1e-9 ) ? 0 : n*log(n);
+}
+
+ 
+// e1 * log( (ePlus-1)/(e0+1) * rhoLo ), where e0 = _e0-immer0 and
+// ePlus = cats*cats-_e0.  Returns 0 unless cats*cats-e0 exceeds 1.
+inline double kat_etaFkt(int _e0,int e1,int immer0,int cats)
+{
+  const int cells = cats*cats;
+  const int e0    = _e0 - immer0;
+  const int ePlus = cells - _e0;
+
+  if( !( cells-e0>1 ) )
+    return 0;
+  return e1*log( (ePlus-1.0)/(e0+1.0)*rhoLo );
+}
+
+double mkat_h_full(int n,double tf);
+double mkat_h_part(int n,double cf);
+
+int Hash(const string& s);
+
+
+#endif
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblemKBC.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblemKBC.cpp
@ -0,0 +1,243 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+#include <cstdlib>
+#include "KategProblem.h"
+
+// Factor used by kat_etaFkt() and subtracted inside the CRITERION_LO bigram term.
+double rhoLo=0.75; 
+// Size of the lookup table consulted by verfaelsche(int,double).
+#define MAX_VERFAELSCHUNG 5000
+// verfTab is only consulted when the requested sigma equals verfTabSigma;
+// -1.0 is the initial "no sigma tabulated" value.
+double verfTab[MAX_VERFAELSCHUNG],verfTabSigma=-1.0;
+// "Distorted" count for integer count `a` and sigma `b`:
+//   b*(erf(10000) - erf(a/b))/2 + a
+// The value is read from verfTab when `a` is a valid table index and the
+// table sigma (verfTabSigma) equals `b`; otherwise it is computed directly.
+double verfaelsche(int a,double b)
+{
+  const bool tabulated = a>=0&&verfTabSigma==b&&a<MAX_VERFAELSCHUNG;
+  if( !tabulated )
+    return b*(erf(10000.0) - erf(a/b))/2+a;
+
+  massert(verfTab[a]== b*(erf(10000.0) - erf(a/b))/2+a);
+  return verfTab[a];
+}
+// Overload for real-valued counts.  It always aborts the program, so any call
+// that resolves here terminates; the return statement is never reached.
+double verfaelsche(double,double b)
+{
+  abort();
+  return b;
+}
+
+// Build the class-bigram statistics for `s` classes.
+//   s  : number of classes; all count tables start at zero
+//   sv : sigma of the count distortion ("Verfaelschung"); 0 disables it
+//
+// When distortion is enabled, the global verfTab memo table is filled for
+// this sigma BEFORE verfTabSigma marks it valid.  Previously verfTabSigma was
+// set without ever filling the table, so later verfaelsche(a,sv) calls
+// returned the table's zero entries instead of the distorted counts.
+// With sv==0 the table is left untouched, so verfTabSigma always describes
+// what verfTab really holds.
+KategProblemKBC::KategProblemKBC(int s,double sv) : 
+  _n(s),_n1(s,0),_n2(s,0),sigmaVerfaelschung(sv),withVerfaelschung(sv!=0.0),
+  _nverf(s),_n1verf(s,0.0),_n2verf(s,0.0),_nWords(0),
+  eta0(s*s),eta1(0),c1_0(s),c2_0(s),
+  _bigramVerfSum(0.0),_unigramVerfSum1(0.0),_unigramVerfSum2(0.0),nKats(s)
+{
+  verfInit0=0.0;
+  if( withVerfaelschung )
+    {
+      // Same expression as in verfaelsche(int,double), so its exact-equality
+      // assertion on table entries holds.
+      for(int a=0;a<MAX_VERFAELSCHUNG;a++)
+        verfTab[a]=sv*(erf(10000.0) - erf(a/sv))/2+a;
+      verfTabSigma=sv;
+
+      verfInit0=verfaelsche(0,sv);
+      cout << "VERFAELSCHUNG wird mitgefuehrt => LANGSAMER!!!\n";
+    }
+
+  // Every cell and every marginal starts at the distorted value of count 0.
+  for(int i=0;i<s;i++)
+    {
+      _n[i].init(s,0);
+      _nverf[i].init(s,verfInit0);
+      _n1verf[i]=_n2verf[i]=verfInit0;
+      _bigramVerfSum+=verfInit0*s;
+      _unigramVerfSum1+=verfInit0;
+      _unigramVerfSum2+=verfInit0;
+    }
+  if( withVerfaelschung )
+    {
+      cout << "VERFAELSCHUNG " << _bigramVerfSum << " " << _unigramVerfSum1 << " " << _unigramVerfSum2 << endl;
+    }
+}
+
+// Set the count of cell (w1,w2) to `n` by first removing the current count
+// and then adding the new one, so addN() keeps all derived statistics in step.
+void KategProblemKBC::setN(int w1,int w2, FreqType n)
+{
+  const FreqType current = _n[w1][w2];
+  addN(w1,w2,-current);
+  addN(w1,w2,n);
+}
+  
+
+// Compute the clustering score from scratch for the given criterion
+// (CRITERION_ML, CRITERION_MY or CRITERION_LO).  Any other value prints an
+// error to cerr and terminates the program with exit(1).
+double KategProblemKBC::fullBewertung(int auswertung)
+{
+  double score=0;
+
+  if( auswertung==CRITERION_ML )
+    {
+      // minus sum h(n(c1,c2)), plus h of both marginals per class
+      for(int row=0;row<nKats;row++)
+        {
+          for(int col=0;col<nKats;col++)
+            score-=kat_h(_n[row][col]);
+          score+=kat_h(_n1[row])+kat_h(_n2[row]);
+        }
+    }
+  else if( auswertung==CRITERION_MY )
+    {
+      for(int row=0;row<nKats;row++)
+        {
+          for(int col=0;col<nKats;col++)
+            score-=mkat_h_full((int)n(row,col),nverf(row,col));
+          score+=mkat_h_part((int)(n1(row)),n1verf(row))+mkat_h_part((int)(n2(row)),n2verf(row));
+        }
+
+      // Distorted sums with the share of the all-zero classes/cells removed.
+      const double u1=_unigramVerfSum1-verfInit0*c1_0;
+      const double u2=_unigramVerfSum2-verfInit0*c2_0;
+      const double b=_bigramVerfSum-verfInit0*(c1_0*nKats+c2_0*nKats-c1_0*c2_0);
+      if( verboseMode>1 )
+        {
+          cout << "CRITERION_MY: " << score << endl;
+          cout << "U1:"<<_unigramVerfSum1 << " n:"<<u1<< " " 
+               << "U2:"<<_unigramVerfSum2 << " n:"<<u2<< " " 
+               << "U3:"<<_bigramVerfSum   << " n:"<<b<< endl;
+        }
+
+      if( !(b>0.000001) )
+        cout << "B zu klein " << b << endl;
+      else
+        {
+          const double normTerm=_nWords*log( u1 * u2 / b );
+          if(verboseMode>1 )
+            cout <<  "  NEU: " <<normTerm << endl;
+          score -= normTerm;
+          if(verboseMode>1)
+            cout << "SCHLUSSBEWERTUNG: " << score << endl;
+        }
+    }
+  else if( auswertung==CRITERION_LO )
+    {
+      for(int row=0;row<nKats;row++)
+        {
+          for(int col=0;col<nKats;col++)
+            score-=_n[row][col]*kat_mlog(_n[row][col]-1-rhoLo);
+          score+=_n1[row]*kat_mlog(_n1[row]-1)+_n2[row]*kat_mlog(_n2[row]-1);
+        }
+      score-=kat_etaFkt(eta0,eta1,(c1_0*nKats+c2_0*nKats-c1_0*c2_0),nKats);
+    }
+  else
+    {
+      cerr << "Error: wrong criterion " << auswertung << endl;
+      exit(1);
+    }
+
+  return score;
+}
+
+// Normalisation term of CRITERION_MY: -(_nWords * log(u1*u2/b)), where u1, u2
+// and b are the distorted unigram/bigram sums with the share of the all-zero
+// classes removed.  Only meaningful when distortion is enabled (asserted).
+double KategProblemKBC::myCriterionTerm()
+{
+  iassert( withVerfaelschung );
+
+  const double u1=_unigramVerfSum1-verfInit0*c1_0;
+  const double u2=_unigramVerfSum2-verfInit0*c2_0;
+  const double b=_bigramVerfSum-verfInit0*(c1_0*nKats+c2_0*nKats-c1_0*c2_0);
+
+  if( verboseMode>1 )
+    {
+      cout << "nwords divisor:"<<_nWords << " " << u1 * u2 / b << endl;
+      cout << "ergebnis:      "<<_nWords*log( u1 * u2 / b ) << endl;
+      cout << "0:             "<<c1_0 << endl;
+    }
+
+  const double term = _nWords*log( u1 * u2 / b );
+  return -term;
+}
+
+
+
+
+// Recompute the sum of all distorted bigram cells from scratch, print it to
+// cout and return it.
+double KategProblemKBC::bigramVerfSum()
+{
+  double total=0;
+  for(int row=0;row<nKats;row++)
+    {
+      for(int col=0;col<nKats;col++)
+        total+=nverf(row,col);
+    }
+  cout << "BIGRAMVERFSUM: " << total << endl;
+  return total;
+}
+
+// Recompute the sum of the distorted first-position marginals from scratch,
+// print it to cout and return it.
+double KategProblemKBC::unigramVerfSum1()
+{
+  double total=0;
+  for(int cls=0;cls<nKats;cls++)
+    {
+      total+=n1verf(cls);
+    }
+  cout << "UNIGRAMVERFSUM1: " << total << endl;
+  return total;
+}
+
+// Recompute the sum of the distorted second-position marginals from scratch,
+// print it to cout and return it.
+double KategProblemKBC::unigramVerfSum2()
+{
+  double total=0;
+  for(int cls=0;cls<nKats;cls++)
+    {
+      total+=n2verf(cls);
+    }
+  cout << "UNIGRAMVERFSUM2: " << total << endl;
+  return total;
+}
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblemKBC.h
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblemKBC.h
@ -0,0 +1,157 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+
+
+
+#ifndef KATEGPROBLEMKBC_H
+#define KATEGPROBLEMKBC_H
+
+// One row of the class-bigram table: plain counts and their distorted values.
+typedef Array<FreqType> FreqArray;
+typedef Array<double> FreqArrayReal;
+
+
+// Distorted value of count `a` for sigma `b`; see KategProblemKBC.cpp.
+// The double overload aborts the program when called.
+double verfaelsche(int a,double b);
+double verfaelsche(double a,double b);
+
+// Class-bigram statistics ("KBC") of a word-class assignment: the count table
+// n(c1,c2), its two marginals, optional distorted ("verf") copies of all of
+// them, and the counters needed by the scoring criteria in fullBewertung().
+class KategProblemKBC
+
+
+{
+ friend class KategProblem;
+
+ private:
+  Array<FreqArray> _n;        // n(c1,c2): count per class pair
+  Array<FreqType> _n1;        // marginal indexed by the first class (w1 in addN)
+                       
+  Array<FreqType> _n2;        // marginal indexed by the second class (w2 in addN)
+                       
+			
+  double sigmaVerfaelschung;  // sigma passed to verfaelsche()
+  short withVerfaelschung;    // non-zero iff sigma != 0 (set in the constructor)
+
+  Array<FreqArrayReal> _nverf; // distorted copy of _n
+  Array<double> _n1verf;       // distorted copy of _n1
+  Array<double> _n2verf;       // distorted copy of _n2
+  FreqType _nWords;            // sum of all added counts; only maintained when distortion is on
+
+ protected:
+  int eta0;            // number of class pairs with count 0 (starts at nKats*nKats)
+  int eta1;            // number of class pairs with count 1
+  int c1_0;            // number of classes whose _n1 marginal is 0
+  int c2_0;            // number of classes whose _n2 marginal is 0
+  double _bigramVerfSum;    // running sum over _nverf
+  double _unigramVerfSum1;  // running sum over _n1verf
+  double _unigramVerfSum2;  // running sum over _n2verf
+  double verfInit0;         // distorted value of count 0 (0.0 when distortion is off)
+
+ public:
+  int nKats;           // number of classes
+
+  // Create zeroed statistics for nKats classes; sv is the distortion sigma.
+  KategProblemKBC(int nKats,double sv);
+  
+
+  // Score of the current statistics for the given criterion.
+  double fullBewertung(int auswertung);
+  
+
+  // Read access to the count table and its marginals.
+  FreqType n(int w1,int w2) { return _n[w1][w2]; };
+  
+
+  FreqType n1(int w) { return _n1[w];};
+  
+
+  FreqType n2(int w) { return _n2[w];};
+  
+  // Recompute the distorted sums from scratch (each also prints its result).
+  double bigramVerfSum();
+  double unigramVerfSum1();
+  double unigramVerfSum2();
+
+  // Read access to the distorted table and marginals.
+  double nverf(int w1,int w2) { return _nverf[w1][w2]; }
+  
+  double n1verf(int w) { return _n1verf[w]; };
+
+  double n2verf(int w) { return _n2verf[w]; };
+
+  // Add n (may be negative) to cell (w1,w2) and update all derived values.
+  inline void addN(int w1,int w2, FreqType n);
+  
+
+  // Set cell (w1,w2) to n via two addN() calls.
+  void setN(int w1,int w2, FreqType n);  
+  
+  // Normalisation term of CRITERION_MY; requires distortion to be enabled.
+  double myCriterionTerm();
+
+};
+
+// Add `n` (may be negative; 0 is a no-op) to the class-pair cell (w1,w2) and
+// keep every derived statistic consistent: both marginals, the zero/one-cell
+// counters eta0/eta1, the empty-class counters c1_0/c2_0 and, when distortion
+// is enabled, the distorted copies, their running sums and _nWords.
+inline void KategProblemKBC::addN(int w1,int w2, FreqType n)    
+{
+  if(n!=0)
+    {
+      FreqType &s= _n[w1][w2];
+      // Step 1: withdraw the OLD state from the counters; the matching
+      // re-registration of the new state happens in step 4.
+      if(s==0)
+	eta0--;
+      else if(s==1)
+	eta1--;
+      if(_n1[w1]==0)
+	c1_0--;
+      if(_n2[w2]==0)
+	c2_0--;
+      
+      // Step 2: update distorted values while s/_n1/_n2 still hold the old
+      // counts, so old and new distorted values can both be computed.
+      if(withVerfaelschung)
+	{
+	  double verfOld=verfaelsche(s,sigmaVerfaelschung);
+	  double verfNew=verfaelsche(s+n,sigmaVerfaelschung);
+	  double verfOld1=verfaelsche(_n1[w1],sigmaVerfaelschung);
+	  assert(verfOld1==_n1verf[w1]);
+	  double verfNew1=verfaelsche(_n1[w1]+n,sigmaVerfaelschung);
+	  double verfOld2=verfaelsche(_n2[w2],sigmaVerfaelschung);
+	  assert(verfOld2==_n2verf[w2]);
+	  double verfNew2=verfaelsche(_n2[w2]+n,sigmaVerfaelschung);
+	  _n1verf[w1]=verfNew1;
+	  _unigramVerfSum1+=verfNew1-verfOld1;
+	  _n2verf[w2]=verfNew2;
+	  _unigramVerfSum2+=verfNew2-verfOld2;
+	  _nverf[w1][w2]=verfNew;
+	  _bigramVerfSum+=verfNew-verfOld;
+	  // Note: _nWords is only tracked on this (distortion-enabled) path.
+	  _nWords+=n;
+	}
+      // Step 3: apply the change to the cell (through the reference s) and to
+      // both marginals.
+      s+=n;_n1[w1]+=n;_n2[w2]+=n; 
+
+      assert(_n[w1][w2]>=0);
+      assert(_n1[w1]>=0);
+      assert(_n2[w2]>=0);
+      
+      // Step 4: register the NEW state in the counters.
+      if(s==0)
+	eta0++;
+      else if(s==1) 
+	eta1++;
+      if(_n1[w1]==0)
+	c1_0++;
+      if(_n2[w2]==0)
+	c2_0++;
+    }
+};
+#endif
--- a/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblemTest.cpp
+++ b/mgiza-aligner/mgiza/experimental/alignment-enabled/MGIZA/src/mkcls/KategProblemTest.cpp
@ -0,0 +1,700 @@
+/*
+
+Copyright (C) 1997,1998,1999,2000,2001  Franz Josef Och
+
+mkcls - a program for making word classes .
+
+This program is free software; you can redistribute it and/or
+modify it under the terms of the GNU General Public License
+as published by the Free Software Foundation; either version 2
+of the License, or (at your option) any later version.
+
+This program is distributed in the hope that it will be useful, 
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+GNU General Public License for more details.
+
+You should have received a copy of the GNU General Public License
+along with this program; if not, write to the Free Software
+Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, 
+USA.
+
+*/
+
+
+
+
+#include "KategProblemTest.h"
+
+#include "ProblemTest.h"
+#include "HCOptimization.h"
+#include "TAOptimization.h"
+#include "RRTOptimization.h"
+#include "GDAOptimization.h"
+
+#include <cstdlib>
+#include <cstdio>
+#include <string>
+#include <strstream>
+
+// Key type of the bigram count tables: (first word, second word).
+typedef pair<string,string> PSS;
+
+// Same text as the literal that fromKModel() substitutes for a "$" token in
+// the corpus and that writeClasses() maps back to "$".
+#define NEW_SENTENCE_END "mkcls-mapped-dollar-symbol-$"
+
+#ifdef NeXT
+// Replacement strdup for NeXT builds: returns a malloc'ed copy of `a` that the
+// caller releases with free(), or a null pointer if the allocation fails
+// (the unchecked malloc result used to be handed straight to strcpy).
+char *strdup(char *a)
+{
+  char *p = (char *)malloc(strlen(a)+1);
+  if( p )
+    strcpy(p,a);
+  return p;
+}
+
+#endif
+
+
+// Write one "<word>\t<class>" line per vocabulary entry to `to`.
+// The word "$" itself is skipped, and the placeholder
+// "mkcls-mapped-dollar-symbol-$" is written back as "$".
+void writeClasses(Array<Kategory> &katOfWord,KategProblem &problem,ostream &to)
+{
+  for(int idx=0;idx<katOfWord.size();idx++)
+    {
+      if( strcmp(problem.getString(idx),"$")==0 )
+        continue;
+
+      if( strcmp(problem.getString(idx),"mkcls-mapped-dollar-symbol-$")==0 )
+        {
+          to << "$" << "\t" << katOfWord[idx] << endl;
+        }
+      else
+        {
+          to << problem.getString(idx) << "\t" << katOfWord[idx] << endl;
+        }
+    }
+}
+
+
+// Split `s` at its first run of blanks/tabs: s1 receives everything before the
+// run, s2 everything after it (including any later whitespace).  Both parts
+// are asserted to be non-empty.
+void mysplit(const string &s,string &s1,string &s2)
+{
+  string::size_type firstGap=s.find_first_of(" \t");
+  if( firstGap==string::npos )
+    firstGap=s.length();
+  s1=s.substr(0,firstGap);
+
+  string::size_type restStart=s.find_first_not_of(" \t",firstGap);
+  if( restStart==string::npos )
+    restStart=s.length();
+  s2=s.substr(restStart,s.length()-restStart);
+
+  iassert(s1.size());
+  iassert(s2.size());
+}
+
+
+
+// Read an initial word->category assignment from `fname` into p->initLike.
+// Each line is "<word> <category-label>".  Labels "0" and "1" keep their
+// numbers; every other label gets the next free number starting at 2.
+// Words missing from the vocabulary only produce a warning.  The word "$" is
+// always put into category 0.  Exits the program if the file cannot be opened
+// or more categories are needed than p->katFreq.nKats provides.
+// Returns 1 if some vocabulary word has no category afterwards (reported on
+// cerr when `verb` is set), 0 otherwise.
+int fromCatFile(KategProblem *p,const char *fname,bool verb)
+{
+  leda_h_array<string,int> translation(-1);
+  int maxCat=2;
+  ifstream in(fname);
+  if(!in)
+    {
+      cerr << "Error: File '" << fname << "' cannot be opened.\n";
+      exit(1);
+    }
+
+  // Start with "no category" for every word.
+  for(int w=0;w<p->wordFreq.nWords;w++)
+    (p->initLike)[w]= -1;
+
+  translation["1"]=1;
+  translation["0"]=0;
+
+  string line;
+  while( getline(in,line) )
+    {
+      string word,label;
+      mysplit(line,word,label);
+      int pos=p->words->binary_locate(word);
+      if( !(pos>=0 && (*(p->words))[pos]==word) )
+        {
+          cerr << "Warning: Word '" << word << "' " << pos << " is not in training corpus.\n";
+          continue;
+        }
+
+      // First occurrence of a label allocates the next category number.
+      if( translation[label]==-1 )
+        translation[label]=maxCat++;
+      int cat=translation[label];
+      if( (p->initLike)[pos]!= -1 )
+        cerr << "Warning: Word '" << ((*(p->words))[pos])<< "' is already in a category.\n";
+      (p->initLike)[pos]=cat;
+    }
+
+  if( verboseMode )
+    cout << "We have " << maxCat << " read non-empty categories" 
+      " (with words from the corpus).\n";
+
+  if(maxCat>p->katFreq.nKats)
+    {
+      cerr << "Error: Not enough categories reserved (only " 
+           << p->katFreq.nKats << ", but i need " << maxCat << ").\n";
+      exit(1);
+    }
+
+  // The sentence boundary always lives in category 0.
+  int dollar=p->words->binary_locate("$");
+  if( dollar>=0 &&  (*(p->words))[dollar]=="$" )
+    {
+      (p->initLike)[dollar]=0;
+    }
+  else if( verboseMode )
+    {
+      cerr << "Warning: No '$' in vocabulary!\n";
+    }
+
+  int errors=0;
+  for(int w=0;w<p->wordFreq.nWords;w++)
+    {
+      if((p->initLike)[w]!= -1 )
+        continue;
+      if( verb ) cerr << "Error: I don't know the category of word " << w 
+           << " (" << (*(p->words))[w] << ") " << ".\n";
+      errors=1;
+    }
+  return errors;
+}
+
+
+
+// Build a KategProblem from a bigram count table.
+//   cTbl         : (word1,word2) -> count
+//   setVokabular : all words occurring in cTbl
+//   remaining parameters are forwarded to the KategProblem constructor.
+// The vocabulary is copied into a heap-allocated array that the returned
+// problem references through `words`; this function never frees it.
+// Bigrams with an empty second word and the pair ("$","$") are ignored.
+//
+// Fix: the sortedness check used `z<ctr-1` with an unsigned counter, which
+// wraps around for an empty vocabulary and walks far out of bounds; the bound
+// is now written as `z+1<ctr`.
+KategProblem *makeKategProblem(const leda_h_array<PSS,FreqType>&cTbl,const leda_set<string>&setVokabular, int maxClass,int initialisierung,
+			 int auswertung,int nachbarschaft,int minWordFrequency)
+{
+  
+  int nwrd=0;
+  leda_array<string>&sVok = *new leda_array<string>(setVokabular.size());
+  string s;
+  unsigned int ctr=0;
+  forall_set(leda_set<string>,s,setVokabular)
+    {
+      if( verboseMode>2 )
+        cout << "mkcls:Wort " << ctr << " " << s << endl;
+      sVok[ctr++]=s;
+    }
+  // The set is expected to enumerate its members in ascending order.
+  for(unsigned int z=0;z+1<ctr;z++)
+    iassert( sVok[z]<sVok[z+1] );
+  sVok.sort();
+
+  if( verboseMode>2 )
+    cout << "*****Vocabulary: " << sVok;
+  
+  unsigned int vokSize=sVok.size();
+  massert(vokSize==ctr); massert(vokSize==setVokabular.size());
+  if(verboseMode)
+    {cout << "Size of vocabulary: " << vokSize << "\n";cout.flush();}
+  
+  KategProblem *k = new KategProblem(vokSize,maxClass,initialisierung,
+                                     auswertung,nachbarschaft,minWordFrequency);
+  KategProblemWBC &w=k->wordFreq;
+  k->words=&sVok;
+  
+  Array<int> after(vokSize,0);
+  Array<int> before(vokSize,0);
+  
+  // Pass 1: count, per word, how many distinct successors and predecessors it
+  // has, so the per-word frequency lists can be sized before being filled.
+  nwrd=0;
+  {
+    PSS s;
+    forall_defined_h2(PSS,FreqType,s,cTbl)
+      {
+        const string&ss1=s.first;
+        const string&ss2=s.second;
+        if( ss2.length()&&(ss1!="$" || ss2!="$") )
+          {
+            int i1=sVok.binary_search(ss1);
+            int i2=sVok.binary_search(ss2);
+            iassert( sVok[i1] == ss1 );iassert( sVok[i2] == ss2 );
+            after[i1]++;
+            before[i2]++;
+          }
+        if( verboseMode&&((nwrd++)%10000==0) ) 
+          {cout<<"Statistiken-1 " << nwrd<< ".      \r";cout.flush();}
+      }
+  }
+  
+  for(unsigned int i=0;i<vokSize;i++)
+    {
+      w.setAfterWords(i,after[i]);
+      w.setBeforeWords(i,before[i]);
+    }
+  
+  // Pass 2: store the actual bigram frequencies.
+  {
+    nwrd=0;
+    PSS s;
+    forall_defined_h2(PSS,FreqType,s,cTbl)
+      {
+        const string&ss1=s.first;
+        const string&ss2=s.second;
+        FreqType p=cTbl[s];
+        if( ss2.length()&&(ss1!="$" || ss2!="$") )
+          {
+            int i1=sVok.binary_search(ss1);
+            int i2=sVok.binary_search(ss2);
+            iassert( sVok[i1] == ss1 );iassert( sVok[i2] == ss2 );
+            w.setFreq(i1,i2,p);
+            if( verboseMode>2 )
+              cout << "BIGRAMM-HAEUF: " << ss1 << ":" << i1 << "   " 
+                   << ss2 << ":" << i2 << "   " << p << endl;
+          }
+        if( verboseMode&&((nwrd++)%10000==0) ) 
+          {cout<<"Statistiken-2 " <<nwrd<< ".    \r";cout.flush();}
+     }
+  }
+  
+  w.testFull();
+  if(verboseMode){cout << "Datenintegritaet getestet.\n";cout.flush();}
+  return k;
+}
+
+// Build a KategProblem from a bigram count file whose records are
+// "<count> <word1> <word2>".  Returns 0 if the file cannot be opened, if a
+// record has an empty word, or if a count is 0 (the latter two print a
+// message on cerr).  Reading stops at the first record that fails to parse.
+KategProblem *fromNgrFile(const char *str,int maxClass,int initialisierung,
+			 int auswertung,int nachbarschaft,int minWordFrequency)
+{
+  ifstream file(str);
+  if(!file)
+    return 0;
+
+  leda_set<string> setVokabular;
+  leda_h_array<PSS,FreqType> cTbl;
+  if( verboseMode )
+    cout << "NGRFILE: " << str << endl;
+
+  double count=0;
+  string left,right;
+  // `count` is reset after every record so a stale value never survives.
+  for(; file >> count >> left >> right; count=0)
+    {
+      if( left.length()==0||right.length()==0 )
+        {
+          cerr << "ERROR: strings are zero: " << left.length() <<" " << left <<" " << right.length()<<" " << right << endl;
+          return 0;
+        }
+      if( count==0 )
+        {
+          cerr << "Count ist 0 " << left << " " << right << endl;
+          return 0;
+        }
+      cTbl[PSS(left,right)]=(FreqType)count;
+      setVokabular.insert(left);
+      setVokabular.insert(right);
+      if( verboseMode>1 )
+        cout << "R: " << left << " " << right << " " << count << endl;
+    }
+
+  return makeKategProblem(cTbl,setVokabular,maxClass,initialisierung,auswertung,nachbarschaft,minWordFrequency);
+}
+
+
+
+	
+
+	
+
+
+// Build a KategProblem from a plain-text corpus with one sentence per line.
+// Every pair of adjacent tokens is counted as a bigram; "$" marks the sentence
+// boundary, so each line contributes ("$",first) ... (last,"$").  A literal
+// "$" token in the text is replaced by "mkcls-mapped-dollar-symbol-$" so that
+// it cannot be confused with the boundary marker.
+// Returns 0 (after printing an error) if the file cannot be opened.
+KategProblem *fromKModel(const char *str,int maxClass,int initialisierung,
+			 int auswertung,int nachbarschaft,int minWordFrequency)
+{
+  string oldText,text,line;
+  ifstream f(str);
+  if( !f )
+    {
+      cerr << "ERROR: can not open file " << str << ".\n";
+      return 0;
+    }
+  
+  leda_set<string> setVokabular;
+  leda_h_array<PSS,FreqType> cTbl(0);
+  // The corpus starts as if a sentence boundary had just been seen.
+  oldText="$";
+  while(1)
+    {
+      getline(f,line);
+      // Failure without EOF: warn, reset the state and keep reading.
+      if(f.fail() && !f.bad() && !f.eof())
+	{
+	  cerr << "WARNING: strange characters in stream (getline) " << endl;f.clear();
+	}
+      if(!f)break;
+      
+      istrstream f2(line.c_str());
+      while( 1 )
+	{
+	  f2 >> text;
+	  if(f2.fail() && !f2.bad() && !f2.eof())
+	    {
+	      cerr << "WARNING: strange characters in stream (>>) !\n";
+	      // clear(state) SETS the stream state, so failbit stays set here
+	      // and the check below ends the token loop for this line.
+	      f2.clear(ios::failbit);
+	    }
+	  if(!f2){break;}
+	  
+	    
+	    
+	    
+	    
+	    
+	  if( text == "$" )
+	    text = "mkcls-mapped-dollar-symbol-$";
+	  if( !setVokabular.member(text) )setVokabular.insert(text);
+	  cTbl[pair<string,string>(oldText,text)]++;
+	  oldText=text;
+	}
+      // End of line: close the sentence with the boundary marker.
+      text="$";
+      if( !setVokabular.member(text) )setVokabular.insert(text);
+      cTbl[pair<string,string>(oldText,text)]++;
+      oldText=text;
+    }
+  return makeKategProblem(cTbl,setVokabular,maxClass,initialisierung,auswertung,nachbarschaft,minWordFrequency);
+}
+ 
+
+
+
+
+// Choose the default annealing parameters of the TA, RRT and GDA optimizers
+// depending on whether the problem selects categories with K_BEST.
+void KategProblemSetParameters(KategProblem &p)
+{
+  const bool bestKat = ( p.katwahl()==K_BEST );
+
+  TAOptimization::defaultAnnRate  = bestKat ? 0.7  : 0.4;
+  RRTOptimization::defaultAnnRate = bestKat ? 0.95 : 0.6;
+  GDAOptimization::defaultAlpha   = bestKat ? 0.05 : 0.0125;
+
+  if( verboseMode )
+    {
+      if( bestKat )
+        cout << "Parameter-setting like W-DET-BEST\n";
+      else
+        cout << "Parameter-setting like W-DET-DET\n";
+    }
+}
+
+
+
+
+// Create a heap-allocated KategProblem with ANZ_WORD words and random bigram
+// counts.  About ANZ_WORD*ANZ_WORD*relInit random cells are drawn (with
+// repetition); every draw adds a random amount between 1 and 10 to its cell.
+// The caller receives a reference to the new object.
+KategProblem &makRandom(int ANZ_WORD,int ANZ_CLS,int initValue,
+			int auswertung,int nachbarschaft,float relInit)
+{
+  KategProblem *problem=
+    new KategProblem(ANZ_WORD,ANZ_CLS,initValue,auswertung,nachbarschaft);
+  KategProblemWBC &freq=problem->wordFreq;
+  Array<int> after(ANZ_WORD,0);
+  Array<int> before(ANZ_WORD,0);
+  Array<FreqArray> counts(ANZ_WORD);
+  for(int row=0;row<ANZ_WORD;row++)
+    counts[row].init(ANZ_WORD,0);
+
+  // Sanity check: everything starts at zero.
+  for(int row=0;row<ANZ_WORD;row++)
+    {
+      massert(after[row]==0);
+      massert(before[row]==0);
+      for(int col=0;col<ANZ_WORD;col++)
+        {
+          massert(counts[row][col]==0);
+        }
+    }
+
+  const float draws=ANZ_WORD*ANZ_WORD*relInit;
+  for(int d=0;d<draws;d++)
+    {
+      int x=randomInt(ANZ_WORD);
+      int y=randomInt(ANZ_WORD);
+      // A cell touched for the first time adds one successor/predecessor.
+      if(counts[x][y]==0)
+        {
+          after[x]++;
+          before[y]++;
+        }
+      counts[x][y]+=randomInt(10)+1;
+    }
+
+  for(int word=0;word<ANZ_WORD;word++)
+    {
+      freq.setAfterWords(word,after[word]);
+      freq.setBeforeWords(word,before[word]);
+    }
+
+  for(int row=0;row<ANZ_WORD;row++)
+    for(int col=0;col<ANZ_WORD;col++)
+      {
+        if( counts[row][col] )
+          freq.setFreq(row,col,counts[row][col]);
+      }
+
+  freq.testFull();
+  return *problem;
+}
+
+
+
+
+// Build a title string: a fixed-width tag for the optimization method
+// followed by whatever problem.makeTitle() appends.  The result is a
+// strdup'ed copy that the caller must release with free().
+//
+// Fix: for a `verfahren` value that matches no case, the buffer used to stay
+// uninitialized and strlen() read indeterminate memory; it now starts out as
+// the empty string, so such a title simply has no method tag.
+char *makeTitle(KategProblem &problem,int verfahren)
+{
+  char x[1024];
+  x[0]='\0';
+  switch(verfahren)
+    {
+    case HC_OPT:
+      strcpy(x,"HC   ");
+      break;
+    case SA_OPT:
+      strcpy(x,"SA     ");
+      break;
+    case TA_OPT:
+      strcpy(x,"TA     ");
+      break;
+    case GDA_OPT:
+      strcpy(x,"GDA    ");
+      break;
+    case RRT_OPT:
+      strcpy(x,"RRT    ");
+      break;
+    default:
+      break;
+    }
+  // The problem appends its own description directly behind the tag.
+  problem.makeTitle(x+strlen(x));
+  return strdup(x);
+}
+
+
+
+
+// _izrOptimization() creates at most MAX_MULTIPLE*anzprob-1 reduced problems
+// per reduction step and sizes its result array as MAX_MULTIPLE*anzprob.
+#define MAX_MULTIPLE 10  
+
+// One step of the iterated state-space reduction ("Iterierte
+// Zustandsraum-Reduktion"), applied recursively.
+//
+//   probs         : solved problems over the same vocabulary; ALL non-null
+//                   entries are deleted by this call
+//   anzprob       : number of problems to intersect (must be > 1)
+//   timeForOneRed : time budget in seconds for creating reduced problems
+//   maxClock      : absolute clockSec() limit; 0 disables the limit
+//   katOfWord     : output, final category of every word of this level
+//   anzIter       : recursion depth (0 at the top level)
+//   verfahren     : optimization method handed to solveProblem()
+//
+// Words that share a category in every one of the first `useAnzprob` problems
+// are merged into one "word" of a reduced problem.  If merging removes fewer
+// than 5% of the words, one problem is dropped and the merge is retried.
+// Reduced problems are then created, solved and sorted; unless the reduced
+// vocabulary is no larger than the number of categories or the time limit has
+// passed, the function recurses on them.
+// Returns a heap-allocated array with the problems of the deepest level.
+//
+// Fix: the per-level category array of the recursive branch was allocated with
+// `new` and never released; it is now a local object.
+Array<KategProblem *> &_izrOptimization(Array<KategProblem *> &probs,
+int anzprob,double timeForOneRed,double maxClock,Array<Kategory> &katOfWord,
+int anzIter,int verfahren)
+{
+  massert(anzprob>1);
+  massert(probs[0]->wordFreq.mindestAnzahl<=1);
+  KategProblem *p0=probs[0];
+
+  int nWords=p0->wordFreq.nWords;
+  int nKats=p0->katFreq.nKats;
+  int minimumNumberOfWords = max(1,int(nWords*0.95));
+
+  int indexOfDurchschnitt;
+  Array<int> newWords(nWords);
+  int useAnzprob=anzprob;
+  do
+    {
+      int w,k;
+      indexOfDurchschnitt=0;
+      for(w=0;w<nWords;w++)
+        newWords[w]=-1;
+      for(k=0;k<useAnzprob;k++)
+        {
+          massert(probs[k]->wordFreq.nWords==nWords);
+          probs[k]->makeKats();
+        }
+      
+      for(w=0;w<nWords;w++)
+        {
+          if( newWords[w]==-1 )
+            {
+              // Intersection of the categories that contain word w in each of
+              // the problems in use.
+              leda_set<int> durchschnitt=(*p0->kats)[p0->katOfWord(w)];
+              for(k=1;k<useAnzprob;k++)
+              durchschnitt = durchschnitt & (*probs[k]->kats)[probs[k]->katOfWord(w)];
+              
+              // Every member of the intersection maps to the same new word.
+              int _anzInDurchschnitt=0;
+              int nr=0;
+              forall_set(leda_set<int>,nr,durchschnitt)
+                {
+                  _anzInDurchschnitt++;
+                  newWords[nr]=indexOfDurchschnitt;
+                }
+              if( verboseMode && _anzInDurchschnitt>1 && anzIter==0 )
+                {
+                  cout << "- (";
+                    forall_set(leda_set<int>,nr,durchschnitt)
+                    {
+                      cout << p0->getString(nr);
+                      if( p0->wordFreq.n1(nr)==1 )
+                        cout << "* ";
+                      else
+                        cout << " ";
+                    }
+                  cout << ")\n";
+                }
+              
+              // NOTE(review): the result of this subtraction is not read
+              // afterwards in this function; kept unchanged.
+              for(k=0;k<useAnzprob;k++)
+                {
+                  durchschnitt = durchschnitt - (*probs[k]->kats)[probs[k]->katOfWord(w)];
+                }
+              indexOfDurchschnitt++;
+            }
+        }
+      
+    // Too little reduction: intersect fewer problems and try again.
+    if(indexOfDurchschnitt>=minimumNumberOfWords)
+        {
+          if(useAnzprob==1)
+            {
+              cout << "useAnzProb==1 => mysterious.\n";
+              break;	
+            }
+          useAnzprob--;
+        }
+    }
+  while(indexOfDurchschnitt>=minimumNumberOfWords);
+  
+  
+  Array<KategProblem *> &neu=*new Array<KategProblem *>(MAX_MULTIPLE*anzprob,(KategProblem *)0);
+  qsort(probs.getPointerToData(),useAnzprob,sizeof(KategProblem *),compareProblem);
+  massert(useAnzprob<=probs.size());
+  double startTime=clockSec();
+  int i, numberOfNew;
+  // Create reduced problems until both the time budget is used up and at
+  // least anzprob of them exist (bounded by the capacity of `neu`).
+  for(numberOfNew=0; (clockSec()-startTime<timeForOneRed) 
+                         || (numberOfNew < anzprob) ; numberOfNew++)
+    {
+      int w;
+      if( numberOfNew==anzprob*MAX_MULTIPLE-1 )
+        break;
+      KategProblem *p 
+        = neu[numberOfNew] 
+          = new KategProblem(indexOfDurchschnitt,nKats-2,
+                          p0->initialisierung,p0->auswertung,p0->nachbarschaft);
+
+      for(w=0;w<indexOfDurchschnitt;w++)
+        {
+          p->wordFreq.setAfterWords(w,5);
+          p->wordFreq.setBeforeWords(w,5);
+        }
+      // Accumulate the original bigram counts onto the merged words.
+      for(w=0;w<nWords;w++)
+        {
+          Array<OneFreq> &after=p0->wordFreq.after[w];
+          int size=after.size();
+          for(i=0;i<size;i++)
+            p->wordFreq.addFreq(newWords[w],newWords[after[i].w],after[i].n);
+        }
+      p->wordFreq.testFull(1);
+      
+      p->wordFreq.set_h_of_words(p0->wordFreq.get_h_of_words());
+      double w1=0.0,w2=0.0;
+      if(numberOfNew<useAnzprob)
+        {
+          // Seed from one of the existing solutions, then improve it with
+          // hill climbing.
+          for(i=0;i<nWords;i++)
+            (p->initLike)[newWords[i]]=probs[numberOfNew]->katOfWord(i);
+          p->_initialize(5);
+          HCOptimization hc(*p,-1);
+          if(verboseMode)
+            {
+              w1=p->nicevalue();
+              cout << "from old category system:" << w1 << endl;
+            }
+          hc.minimize(-1);
+          if(verboseMode)
+            {
+              w2=p->nicevalue();
+              if(w2<w1)
+                cout << "improvement: " << w1-w2 << endl;
+            }
+        }
+      else
+        {
+          // No seed left: solve the reduced problem with `verfahren`.
+          p->_initialize(1);
+          double mean;
+          StatVar end,laufzeit,start;
+          solveProblem(0,*p,1,-1,verfahren,mean,end,laufzeit,start);
+          w2=p->value();
+          if(verboseMode)
+              cout << "new category system: " << w2 << " (" << p->nicevalue() 
+                << ") Zeit: " << clockSec() << "\n";
+        }
+    }
+  // The input problems are no longer needed.
+  int p;
+  for(p=0;p<probs.size();p++)
+    {
+      if( probs[p] )
+        delete probs[p];
+    }
+  qsort(neu.getPointerToData(),numberOfNew,sizeof(Problem *),compareProblem);
+  massert(numberOfNew<=neu.size());
+  if( verboseMode )
+    cout << "Iterierte Zustandsraum-Reduktion: " << indexOfDurchschnitt 
+      << " words. costs: " << neu[0]->value() << " " 
+      << neu[0]->nicevalue() << " (" << numberOfNew-anzprob << ")" << "time: " 
+      << clockSec() << endl;
+  if( indexOfDurchschnitt<=nKats 
+      || (clockSec()>maxClock&&maxClock) )
+    {
+      if( clockSec()>maxClock&&maxClock )
+        cout << "STOP (time limit: " << (clockSec()-maxClock) << " s)\n";
+      for(i=0;i<nWords;i++)
+        katOfWord[i]=neu[0]->katOfWord(newWords[i]);
+      return neu;
+    }
+  else
+    {
+      // The recursion only writes into this array; a local avoids the leak.
+      Array<Kategory> newKatOfWord(neu[0]->wordFreq.nWords,-1);
+      Array<KategProblem *> &erg=_izrOptimization(neu,anzprob,timeForOneRed,
+                                                  maxClock,newKatOfWord,
+                                                  anzIter+1,verfahren);
+      for(i=0;i<nWords;i++)
+        katOfWord[i]=newKatOfWord[newWords[i]];
+      return erg;
+    }
+}
+
+
+
+
+// Entry point of the iterated state-space reduction.
+//   p              : the problem to optimize (left untouched; copies are made)
+//   minN           : number of solutions handed to _izrOptimization()
+//   firstN         : minimum number of start solutions to compute
+//   clockForOneRed : time per reduction step; <=0 means "measure it from the
+//                    time the first minN solutions took"
+//   maxClock       : absolute time limit passed on (0 = none)
+//   verfahren      : optimization method for solveProblem()
+// Returns a new problem initialised with the resulting categories and
+// refined by a final hill-climbing run.
+//
+// Fixes:
+//  * After leaving the start loop through `break`, the loop index is the
+//    index of the last solved problem, not the number of solved problems, so
+//    the sort skipped that problem and massert(i>=firstN) could not hold.
+//    The number of solved problems is now tracked explicitly.
+//  * Unused slots of `probs` are explicitly null, because _izrOptimization()
+//    null-tests and deletes every slot of the array.
+KategProblem *izrOptimization(KategProblem &p,int minN,int firstN,
+			      double clockForOneRed,double maxClock,int verfahren)
+{
+  Array<Kategory> katOfWord(p.wordFreq.nWords,-1);
+  int startN;
+  if( clockForOneRed<=0 )
+    startN=firstN;
+  else
+    startN=1000;
+  Array<KategProblem *> probs(startN,(KategProblem *)0);
+  double val1=0.0,val2=0.0;
+  double endTime=-1;
+
+  double startTime=clockSec();
+  int solved=0;
+  for(int i=0;i<startN;i++)
+    {
+      StatVar end,laufzeit,start;
+      double mean;
+      probs[i] = (KategProblem *)((KategProblem *)p.makeEqualProblem());
+      solveProblem(0,*(probs[i]),1,-1,verfahren,mean,end,laufzeit,start);
+      solved=i+1;
+      if( i==minN-1 )
+        endTime = clockSec();
+      // NOTE(review): this leaves the loop while the time budget has NOT yet
+      // elapsed, which looks inverted -- confirm the intended condition.
+      if( i>=firstN-1 && (startTime+clockForOneRed>clockSec() || i==999) )
+        break;
+    }
+  if( endTime<0 )
+    endTime=clockSec();
+  massert(solved>=firstN);
+
+  qsort(probs.getPointerToData(),solved,sizeof(KategProblem *),compareProblem);
+  massert(solved<=probs.size());
+  if( clockForOneRed<=0 )
+    {
+      clockForOneRed=endTime-startTime;
+      if( verboseMode )
+        cout << "time for one reduction: " << clockForOneRed << endl;
+    }
+  _izrOptimization(probs,minN,clockForOneRed,maxClock,katOfWord,0,verfahren);
+  
+  // Re-create the full problem from the categories found and polish it.
+  KategProblem *n=(KategProblem *)(p.makeEqualProblem());
+  n->initLike= katOfWord;
+  n->_initialize(5);
+  if( verboseMode )
+    val1=n->value();
+  HCOptimization hc(*n,-1);
+  hc.minimize(-1);
+  val2=n->value();
+  if( verboseMode )
+    cout << "last improvement: " << val2-val1 << "\n";
+  cout << "final costs: " << val2 << " " << n->nicevalue() << endl;
+  if(PrintBestTo)
+    n->dumpOn(*PrintBestTo);
+  return n;
+}
+
+
+
+
+
+
+
+
+
+
+
--- a/Show More
+++ b/Show More
				`@ -0,0 +1,2 @@`
				`sed -e 's/^[ \t]//' -e 's/[ \t][ \t]/ /g' -e 's/[ \t]*$//'`