Tests

ivanstepanovftw · ivanstepanovftw · commit 3bf3a968b6f7 · 2023-04-28T20:36:53.000+03:00
diff --git a/tests/test-sampling.cpp b/tests/test-sampling.cpp
@@ -7,6 +7,9 @@
 #include <vector>
 #include <algorithm>
 
+#undef assert
+#define assert(__expr) do { if (!(__expr)) { printf("%s:%d (%s) %s\n", __FILE__, __LINE__, __func__, #__expr); exit(1); } } while(0)
+
 void dump(const llama_token_data_array * candidates) {
     for (size_t i = 0; i < candidates->size; i++) {
         printf("%d: %f (%f)\n", candidates->data[i].id, candidates->data[i].p, candidates->data[i].logit);
@@ -53,13 +56,14 @@ void test_top_p(const std::vector<float> & probs,
     }
 
     llama_token_data_array candidates_p = { candidates.data(), candidates.size(), false };
+    llama_sample_softmax(nullptr, &candidates_p);
     // DUMP(&candidates_p);
     llama_sample_top_p(nullptr, &candidates_p, p);
     // DUMP(&candidates_p);
 
     assert(candidates_p.size == expected_probs.size());
     for (size_t i = 0; i < candidates_p.size; i++) {
-        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-5);
+        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);
     }
 }
 
@@ -82,7 +86,7 @@ void test_tfs(const std::vector<float> & probs,
 
     assert(candidates_p.size == expected_probs.size());
     for (size_t i = 0; i < candidates_p.size; i++) {
-        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-6);
+        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);
     }
 }
 
@@ -105,7 +109,7 @@ void test_typical(const std::vector<float> & probs,
 
     assert(candidates_p.size == expected_probs.size());
     for (size_t i = 0; i < candidates_p.size; i++) {
-        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-6);
+        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);
     }
 }
 
@@ -163,7 +167,7 @@ void test_frequency_presence_penalty(
 
     assert(candidates_p.size == expected_probs.size());
     for (size_t i = 0; i < candidates_p.size; i++) {
-        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-6);
+        assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);
     }
 }
 
@@ -182,9 +186,9 @@ int main(void) {
     test_typical({0.97, 0.01, 0.01, 0.01}, {0.97}, 0.5);
     test_typical({0.4, 0.2, 0.2, 0.2}, {0.2, 0.2, 0.2}, 0.5);
 
-    test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0}, {0, 0.25, 0.25, 0.25, 0.25}, 50.0);
-    test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2}, {0, 0, 0, 0.5, 0.5}, 50.0);
-    test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2, 0, 0}, {0, 0, 0, 0.5, 0.5}, 50.0);
+    test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0}, {0.25, 0.25, 0.25, 0.25, 0}, 50.0);
+    test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2}, {0.5, 0.5, 0, 0, 0}, 50.0);
+    test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2, 0, 0}, {0.5, 0.5, 0, 0, 0}, 50.0);
 
     test_frequency_presence_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0},             {0.249997, 0.249997, 0.249997, 0.249997, 0.000011}, 5.0, 5.0);
     test_frequency_presence_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2},       {0.499966, 0.499966, 0.000023, 0.000023, 0.000023}, 5.0, 5.0);

Original file line number	Diff line number	Diff line change
`@@ -7,6 +7,9 @@`
`7`	`7`	`#include <vector>`
`8`	`8`	`#include <algorithm>`
`9`	`9`
	`10`	`+#undef assert`
	`11`	`+#define assert(__expr) do { if (!(__expr)) { printf("%s:%d (%s) %s\n", __FILE__, __LINE__, __func__, #__expr); exit(1); } } while(0)`
	`12`	`+`
`10`	`13`	`void dump(const llama_token_data_array * candidates) {`
`11`	`14`	`for (size_t i = 0; i < candidates->size; i++) {`
`12`	`15`	`printf("%d: %f (%f)\n", candidates->data[i].id, candidates->data[i].p, candidates->data[i].logit);`
`@@ -53,13 +56,14 @@ void test_top_p(const std::vector<float> & probs,`
`53`	`56`	`}`
`54`	`57`
`55`	`58`	`llama_token_data_array candidates_p = { candidates.data(), candidates.size(), false };`
	`59`	`+ llama_sample_softmax(nullptr, &candidates_p);`
`56`	`60`	`// DUMP(&candidates_p);`
`57`	`61`	`llama_sample_top_p(nullptr, &candidates_p, p);`
`58`	`62`	`// DUMP(&candidates_p);`
`59`	`63`
`60`	`64`	`assert(candidates_p.size == expected_probs.size());`
`61`	`65`	`for (size_t i = 0; i < candidates_p.size; i++) {`
`62`		`- assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-5);`
	`66`	`+ assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);`
`63`	`67`	`}`
`64`	`68`	`}`
`65`	`69`
`@@ -82,7 +86,7 @@ void test_tfs(const std::vector<float> & probs,`
`82`	`86`
`83`	`87`	`assert(candidates_p.size == expected_probs.size());`
`84`	`88`	`for (size_t i = 0; i < candidates_p.size; i++) {`
`85`		`- assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-6);`
	`89`	`+ assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);`
`86`	`90`	`}`
`87`	`91`	`}`
`88`	`92`
`@@ -105,7 +109,7 @@ void test_typical(const std::vector<float> & probs,`
`105`	`109`
`106`	`110`	`assert(candidates_p.size == expected_probs.size());`
`107`	`111`	`for (size_t i = 0; i < candidates_p.size; i++) {`
`108`		`- assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-6);`
	`112`	`+ assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);`
`109`	`113`	`}`
`110`	`114`	`}`
`111`	`115`
`@@ -163,7 +167,7 @@ void test_frequency_presence_penalty(`
`163`	`167`
`164`	`168`	`assert(candidates_p.size == expected_probs.size());`
`165`	`169`	`for (size_t i = 0; i < candidates_p.size; i++) {`
`166`		`- assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-6);`
	`170`	`+ assert(fabs(candidates_p.data[i].p - expected_probs[i]) < 1e-3);`
`167`	`171`	`}`
`168`	`172`	`}`
`169`	`173`
`@@ -182,9 +186,9 @@ int main(void) {`
`182`	`186`	`test_typical({0.97, 0.01, 0.01, 0.01}, {0.97}, 0.5);`
`183`	`187`	`test_typical({0.4, 0.2, 0.2, 0.2}, {0.2, 0.2, 0.2}, 0.5);`
`184`	`188`
`185`		`- test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0}, {0, 0.25, 0.25, 0.25, 0.25}, 50.0);`
`186`		`- test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2}, {0, 0, 0, 0.5, 0.5}, 50.0);`
`187`		`- test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2, 0, 0}, {0, 0, 0, 0.5, 0.5}, 50.0);`
	`189`	`+ test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0}, {0.25, 0.25, 0.25, 0.25, 0}, 50.0);`
	`190`	`+ test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2}, {0.5, 0.5, 0, 0, 0}, 50.0);`
	`191`	`+ test_repetition_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2, 0, 0}, {0.5, 0.5, 0, 0, 0}, 50.0);`
`188`	`192`
`189`	`193`	`test_frequency_presence_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0}, {0.249997, 0.249997, 0.249997, 0.249997, 0.000011}, 5.0, 5.0);`
`190`	`194`	`test_frequency_presence_penalty({0.2, 0.2, 0.2, 0.2, 0.2}, {0, 1, 2}, {0.499966, 0.499966, 0.000023, 0.000023, 0.000023}, 5.0, 5.0);`