
Commit deb7240

mscheong01 and ngxson authored
embedding : adjust n_ubatch value (ggml-org#6296)
* embedding: assign `n_ubatch` value, print error on `n_batch` overflow

* Update examples/embedding/embedding.cpp

  Co-authored-by: Xuan Son Nguyen <[email protected]>

* use %ld instead of %lld

* Revert "use %ld instead of %lld"

  This reverts commit ea753ed.

---------

Co-authored-by: Xuan Son Nguyen <[email protected]>
1 parent 3d032ec commit deb7240

File tree

1 file changed: +5 -1 lines changed


examples/embedding/embedding.cpp

@@ -61,6 +61,8 @@ int main(int argc, char ** argv) {
     }
 
     params.embedding = true;
+    // For non-causal models, batch size must be equal to ubatch size
+    params.n_ubatch = params.n_batch;
 
     print_build_info();
 
@@ -114,7 +116,9 @@ int main(int argc, char ** argv) {
     for (const auto & prompt : prompts) {
         auto inp = ::llama_tokenize(ctx, prompt, true, false);
         if (inp.size() > n_batch) {
-            inp.resize(n_batch);
+            fprintf(stderr, "%s: error: number of tokens in input line (%lld) exceeds batch size (%lld), increase batch size and re-run\n",
+                    __func__, (long long int) inp.size(), (long long int) n_batch);
+            return 1;
         }
         inputs.push_back(inp);
     }

0 commit comments
