latitudegames · Apr 15, 2023
diff --git a/‎.gitignore
+2-1 b/‎.gitignore
+2-1
diff --git a/‎.npmignore
+2 b/‎.npmignore
+2
diff --git a/‎Encoder.js
-178 b/‎Encoder.js
-178
diff --git a/‎Encoder.test.js
-44 b/‎Encoder.test.js
-44
diff --git a/‎data/bpe_ranks.json
+1 b/‎data/bpe_ranks.json
+1
diff --git a/‎encoder.json ‎data/encoder.json b/‎encoder.json ‎data/encoder.json
diff --git a/‎data/getBpe.js
+20 b/‎data/getBpe.js
+20
diff --git a/‎vocab.bpe ‎data/vocab.bpe b/‎vocab.bpe ‎data/vocab.bpe
@@ -1,2 +1,3 @@
 node_modules
-.npmrc
+*.d.ts
+.npmrc
@@ -0,0 +1,2 @@
+.npmrc
+tsconfig.json
@@ -0,0 +1,20 @@
+const path = require("path");
+const fs = require("fs");
+const { dictZip, range } = require("../utils");
+// Build script: reads ./vocab.bpe, turns each merge line into a comma-joined key, and writes the result to ./bpe_ranks.json.
+const bpe_file = fs.readFileSync(path.join(__dirname, "./vocab.bpe"), "utf-8");
+const lines = bpe_file.split("\n");
+// Skips the first and last lines (presumably a header line and the empty string left by a trailing newline -- confirm against vocab.bpe).
+const bpe_merges = lines.slice(1, lines.length - 1).map((x) =>
+  x
+    .split(/(\s+)/) // the capture group keeps the whitespace runs in the split result...
+    .filter((e) => e.trim().length > 0) // ...so drop them, along with any empty strings
+    .join(","), // each merge line becomes its tokens joined by commas
+);
+// NOTE(review): dictZip/range come from ../utils (not shown); presumably this maps each merge string to its index -- confirm.
+const bpe_ranks = dictZip(bpe_merges, range(0, bpe_merges.length));
+// Serialized as JSON into the same directory as this script.
+fs.writeFileSync(
+  path.join(__dirname, "./bpe_ranks.json"),
+  JSON.stringify(bpe_ranks),
+);
-Original file line number
+Diff line change
 node_modules
 -.npmrc
 +*.d.ts
 +.npmrc