Skip to content

Commit 59397a5

Browse files
authored
Fix failing on some models (#20)
1 parent 398675f commit 59397a5

File tree

7 files changed

+37
-15
lines changed

7 files changed

+37
-15
lines changed

3rd_party/crow

Submodule crow updated 92 files

3rd_party/moz-bergamot-translator

Dockerfile

Lines changed: 5 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,6 +24,11 @@ RUN sh -c 'echo deb https://apt.repos.intel.com/mkl all main > /etc/apt/sources.
2424
apt-get update && \
2525
apt-get install -y intel-mkl-64bit-2020.0-088
2626

27+
# attempt to use openblas
28+
#RUN apt search openblas
29+
#RUN apt install -y libopenblas-dev
30+
#RUN update-alternatives --config libblas.so.3
31+
2732
# Bergamot
2833
# pcre2 is required to build bergamot-translator with -DUSE_WASM_COMPATIBLE_SOURCES=off
2934
RUN apt-get install -y libpcre2-dev

Makefile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@ run:
1616
docker run --name translation-service -it --rm -v $$(pwd)/models:/models -p 8080:8080 -e PORT=8080 translation-service
1717

1818
debug:
19-
docker run --name translation-service -it --rm -v $$(pwd):/app -v $$(pwd)/models:/models -p 8080:8080 translation-service bash
19+
docker run --name translation-service -it --rm -v $$(pwd):/app -v $$(pwd)/models:/models -e PORT=8080 -p 8080:8080 translation-service bash
2020

2121
call:
2222
curl --header "Content-Type: application/json" \

scripts/download-test-models.sh

Lines changed: 17 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -1,24 +1,32 @@
11
#!/bin/bash
22

3+
version=0.3.0
4+
35
mkdir models
46
cd models
57

68
mkdir esen
79
mkdir enet
810
mkdir enru
11+
mkdir enbg
912

1013
cd esen
11-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/esen/lex.50.50.esen.s2t.bin
12-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/esen/model.esen.intgemm.alphas.bin
13-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/esen/vocab.esen.spm
14+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/esen/lex.50.50.esen.s2t.bin
15+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/esen/model.esen.intgemm.alphas.bin
16+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/esen/vocab.esen.spm
1417

1518
cd ../enet
16-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/enet/lex.50.50.enet.s2t.bin
17-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/enet/model.enet.intgemm.alphas.bin
18-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/enet/vocab.eten.spm
19+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enet/lex.50.50.enet.s2t.bin
20+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enet/model.enet.intgemm.alphas.bin
21+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enet/vocab.eten.spm
1922

2023

2124
cd ../enru
22-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/enru/lex.50.50.enru.s2t.bin
23-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/enru/model.enru.intgemm.alphas.bin
24-
wget https://storage.googleapis.com/bergamot-models-sandbox/0.2.10/enru/vocab.enru.spm
25+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enru/lex.50.50.enru.s2t.bin
26+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enru/model.enru.intgemm.alphas.bin
27+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enru/vocab.enru.spm
28+
29+
cd ../enbg
30+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enbg/lex.50.50.enbg.s2t.bin
31+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enbg/model.enbg.intgemm.alphas.bin
32+
wget https://storage.googleapis.com/bergamot-models-sandbox/${version}/enbg/vocab.bgen.spm

src/translation.h

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -107,13 +107,14 @@ namespace marian {
107107
"\nmini-batch-words: 1024"
108108
"\nworkspace: 128"
109109
"\nmax-length-factor: 2.0"
110-
"\nskip-costls: True"
110+
"\nskip-cost: True"
111111
"\nquiet: True"
112112
"\nquiet-translation: True"
113-
"\ngemm-precision: int8shift";
113+
"\ngemm-precision: int8shift"
114+
"\nalignment: soft";
114115

115116
options = options + "\nmodels: [" + modelPath + "]\nvocabs: [" + vocabPath + ", " + vocabPath +
116-
"]\nshortlist: [" + shortlistPath + ", 50, 50]";
117+
"]\nshortlist: [" + shortlistPath + ", false]";
117118

118119
return options;
119120
}

tests/integration/test_api.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -44,6 +44,14 @@ def test_non_latin():
4444
assert translation == 'Как дела?' or translation == 'Как у тебя дела?'
4545

4646

47+
def test_different_shortlist():
48+
query = {"from": "en", "to": "bg", "text": 'Hello world'}
49+
50+
resp = requests.post(url + '/v1/translate', json=query)
51+
52+
assert resp.status_code == 200
53+
assert resp.json()['result'] == 'Здравей свят'
54+
4755
def test_json_escaping():
4856
query = {"from": "es", "to": "en", "text": '"Hola Mundo"'}
4957

0 commit comments

Comments
 (0)