resolve conflicts

author: Marcin Junczys-Dowmunt <marcinjd@microsoft.com> 2022-02-06 23:33:58 +0300
committer: Marcin Junczys-Dowmunt <marcinjd@microsoft.com> 2022-02-06 23:33:58 +0300
commit: 3cf9e83bac033a80c7b27912435917d65e40f095 (patch)
tree: 78ff005463dc4334854d7b4980260b345777b9f6
parent: 8da539e835e8661d00697c8bd01164e64ab9ce62 (diff)
parent: e8ea37cd5b85e3df817b9ced68bef9cc64b45d16 (diff)
3 files changed, 8 insertions, 21 deletions
diff --git a/CHANGELOG.md b/CHANGELOG.md
index d42c652e..cf0f3844 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -9,7 +9,11 @@ and this project adheres to [Semantic Versioning](http://semver.org/spec/v2.0.0.
 ## [Unreleased]
 
 ### Added
-- Adds option --add-lsh to marian-conv which allows the LSH to be memory-mapped.
+- Parallelized data reading with e.g. `--data-threads 8`
+- Top-k sampling during decoding with e.g. `--output-sampling topk 10`
+- Improved mixed precision training with `--fp16`
+- Set FFN width in decoder independently from encoder with e.g. `--transformer-dim-ffn 4096 --transformer-decoder-dim-ffn 2048`
+- Adds option `--add-lsh` to marian-conv which allows the LSH to be memory-mapped.
 - Early stopping based on first, all, or any validation metrics via `--early-stopping-on`
 - Compute 8.6 support if using CUDA>=11.1
 - Support for RMSNorm as drop-in replace for LayerNorm from `Biao Zhang; Rico Sennrich (2019). Root Mean Square Layer Normalization`. Enabled in Transformer model via `--transformer-postprocess dar` instead of `dan`.
diff --git a/VERSION b/VERSION
index 60c73ff4..e4afc5eb 100644
--- a/VERSION
+++ b/VERSION
@@ -1,2 +1 @@
-v1.10.28
-
+v1.10.42
diff --git a/src/data/corpus_base.cpp b/src/data/corpus_base.cpp
index 20301103..636752c9 100644
--- a/src/data/corpus_base.cpp
+++ b/src/data/corpus_base.cpp
@@ -566,23 +566,7 @@ size_t CorpusBase::getNumberOfTSVInputFields(Ptr<Options> options) {
   return 0;
 }
 
-<<<<<<< HEAD
-void SentenceTuple::setWeights(const std::vector<float>& weights) {
-  if(weights.size() != 1) {  // this assumes a single sentence-level weight is always fine
-    ABORT_IF(empty(), "Source and target sequences should be added to a tuple before data weights");
-    auto numWeights = weights.size();
-    auto numTrgWords = back().size();
-    // word-level weights may or may not contain a weight for EOS tokens
-    if(numWeights != numTrgWords && numWeights != numTrgWords - 1)
-      LOG(warn,
-          "[warn] "
-          "Number of weights ({}) does not match the number of target words ({}) in line #{}",
-          numWeights,
-          numTrgWords,
-          id_);
-  }
-  weights_ = weights;
-=======
+#if 0
 // experimental: hide inline-fix source tokens from cross attention
 std::vector<float> SubBatch::crossMaskWithInlineFixSourceSuppressed() const
 {
@@ -630,8 +614,8 @@ std::vector<float> SubBatch::crossMaskWithInlineFixSourceSuppressed() const
     ABORT_IF(batchWords() != 0/*n/a*/ && numWords != batchWords(), "batchWords() inconsistency??");
   }
   return m;
->>>>>>> master
 }
+#endif
 
 }  // namespace data
 }  // namespace marian
author	Marcin Junczys-Dowmunt <marcinjd@microsoft.com>	2022-02-06 23:33:58 +0300
committer	Marcin Junczys-Dowmunt <marcinjd@microsoft.com>	2022-02-06 23:33:58 +0300
commit	3cf9e83bac033a80c7b27912435917d65e40f095 (patch)
tree	78ff005463dc4334854d7b4980260b345777b9f6
parent	8da539e835e8661d00697c8bd01164e64ab9ce62 (diff)
parent	e8ea37cd5b85e3df817b9ced68bef9cc64b45d16 (diff)