jlewi · jlewi · Oct 15, 2024 · Oct 15, 2024 · Oct 15, 2024 · Oct 15, 2024
diff --git a/app/pkg/agent/agent.go b/app/pkg/agent/agent.go
@@ -6,6 +6,8 @@ import (
 	"strings"
 	"sync"
 
+	"github.com/jlewi/foyle/app/pkg/runme/ulid"
+
 	"github.com/jlewi/foyle/protos/go/foyle/v1alpha1/v1alpha1connect"
 
 	"google.golang.org/protobuf/encoding/protojson"
@@ -114,6 +116,8 @@ func (a *Agent) Generate(ctx context.Context, req *v1alpha1.GenerateRequest) (*v
 		return nil, err
 	}
 
+	log.Info(logs.Level1Assertion, "assertion", logs.BuildAssertion(v1alpha1.Assertion_AT_LEAST_ONE_BLOCK_POST_PROCESSED, len(postProcessed) > 0))
+
 	// Attach block ids to any blocks generated.
 	// N.B. This is kind of a last resort to make sure all blocks have an ID set. In general, we want to set blockIds
 	// earlier in the processing pipeline so that any log messages involving blocks has block ids set. BlockIDs
@@ -148,8 +152,9 @@ func (a *Agent) completeWithRetries(ctx context.Context, req *v1alpha1.GenerateR
 		})
 	}
 	for try := 0; try < maxTries; try++ {
+		docText := t.Text()
 		args := promptArgs{
-			Document: t.Text(),
+			Document: docText,
 			Examples: exampleArgs,
 		}
 
@@ -172,6 +177,29 @@ func (a *Agent) completeWithRetries(ctx context.Context, req *v1alpha1.GenerateR
 			return nil, errors.Wrapf(err, "CreateChatCompletion failed")
 		}
 
+		// Level1 assertion that docText is a non-empty string
+		assertion := &v1alpha1.Assertion{
+			Name:   v1alpha1.Assertion_NON_EMPTY_DOC,
+			Result: v1alpha1.AssertResult_PASSED,
+			Id:     ulid.GenerateID(),
+		}
+
+		if len(strings.TrimSpace(docText)) == 0 {
+			assertion.Result = v1alpha1.AssertResult_FAILED
+		}
+
+		log.Info(logs.Level1Assertion, "assertion", assertion)
+
+		// Level1 assertion that at least one block is being returned.
+		assertBlocks := &v1alpha1.Assertion{
+			Name:   v1alpha1.Assertion_AT_LEAST_ONE_BLOCK,
+			Result: v1alpha1.AssertResult_PASSED,
+			Id:     ulid.GenerateID(),
+		}
+		if len(blocks) == 0 {
+			assertBlocks.Result = v1alpha1.AssertResult_FAILED
+		}
+		log.Info(logs.Level1Assertion, "assertion", assertBlocks)
 		return blocks, nil
 	}
 	err := errors.Errorf("Failed to generate a chat completion after %d tries", maxTries)

diff --git a/app/pkg/analyze/fsql/eval_query.sql b/app/pkg/analyze/fsql/eval_query.sql
@@ -16,4 +16,14 @@ WHERE id = ?;
 SELECT * FROM results
 WHERE (:cursor = '' OR time < :cursor)
 ORDER BY time DESC
-    LIMIT :page_size;
+    LIMIT :page_size;
+
+-- name: CountResults :one
+-- Count the total number of results
+SELECT COUNT(*) FROM results;
+
+-- name: CountErrors :one
+SELECT COUNT(*) FROM results WHERE json_extract(proto_json, '$.error') IS NOT NULL;
+
+-- name: CountByCellsMatchResult :many
+SELECT json_extract(proto_json, '$.cellsMatchResult') as match_result, COUNT(*) as count FROM results GROUP BY match_result;
diff --git a/app/pkg/analyze/fsql/eval_query.sql.go b/app/pkg/analyze/fsql/eval_query.sql.go
diff --git a/app/pkg/eval/assert.go b/app/pkg/eval/assert.go
@@ -6,6 +6,8 @@ import (
 	"github.com/jlewi/foyle/protos/go/foyle/v1alpha1"
 )
 
+// TODO(jeremy): A lot of this code is probably obsolete now that we are using protos.
+
 // Assertion is an interface for evaluating AI generations.
 type Assertion interface {
 	Assert(ctx context.Context, doc *v1alpha1.Doc, examples []*v1alpha1.Example, answer []*v1alpha1.Block) (*v1alpha1.Assertion, error)
@@ -14,7 +16,3 @@ type Assertion interface {
 }
 
 type AssertResult string
-
-const AssertPassed AssertResult = "passed"
-const AssertFailed AssertResult = "failed"
-const AssertSkipped AssertResult = "skipped"
diff --git a/app/pkg/eval/assertions.go b/app/pkg/eval/assertions.go
@@ -20,7 +20,7 @@ type AssertCodeAfterMarkdown struct {
 
 func (a *AssertCodeAfterMarkdown) Assert(ctx context.Context, doc *v1alpha1.Doc, examples []*v1alpha1.Example, answer []*v1alpha1.Block) (*v1alpha1.Assertion, error) {
 	assertion := &v1alpha1.Assertion{
-		Name: a.Name(),
+		Name: v1alpha1.Assertion_CODE_AFTER_MARKDOWN,
 	}
 
 	if len(doc.Blocks) == 0 {
@@ -62,7 +62,7 @@ type AssertOneCodeCell struct {
 
 func (a *AssertOneCodeCell) Assert(ctx context.Context, doc *v1alpha1.Doc, examples []*v1alpha1.Example, answer []*v1alpha1.Block) (*v1alpha1.Assertion, error) {
 	assertion := &v1alpha1.Assertion{
-		Name: a.Name(),
+		Name: v1alpha1.Assertion_ONE_CODE_CELL,
 	}
 
 	if len(doc.Blocks) == 0 {
@@ -99,7 +99,7 @@ type AssertEndsWithCodeCell struct {
 
 func (a *AssertEndsWithCodeCell) Assert(ctx context.Context, doc *v1alpha1.Doc, examples []*v1alpha1.Example, answer []*v1alpha1.Block) (*v1alpha1.Assertion, error) {
 	assertion := &v1alpha1.Assertion{
-		Name: a.Name(),
+		Name: v1alpha1.Assertion_ENDS_WITH_CODE_CELL,
 	}
 
 	if len(doc.Blocks) == 0 {

diff --git a/app/pkg/eval/assertions_test.go b/app/pkg/eval/assertions_test.go
@@ -23,7 +23,7 @@ func TestAssertCodeAfterMarkdown(t *testing.T) {
 			examples: []*v1alpha1.Example{},
 			answer:   []*v1alpha1.Block{},
 			expected: &v1alpha1.Assertion{
-				Name:   "AssertCodeAfterMarkdown",
+				Name:   v1alpha1.Assertion_CODE_AFTER_MARKDOWN,
 				Result: v1alpha1.AssertResult_SKIPPED,
 			},
 		},
@@ -43,7 +43,7 @@ func TestAssertCodeAfterMarkdown(t *testing.T) {
 				},
 			},
 			expected: &v1alpha1.Assertion{
-				Name:   "AssertCodeAfterMarkdown",
+				Name:   v1alpha1.Assertion_CODE_AFTER_MARKDOWN,
 				Result: v1alpha1.AssertResult_PASSED,
 			},
 		},
@@ -63,7 +63,7 @@ func TestAssertCodeAfterMarkdown(t *testing.T) {
 				},
 			},
 			expected: &v1alpha1.Assertion{
-				Name:   "AssertCodeAfterMarkdown",
+				Name:   v1alpha1.Assertion_CODE_AFTER_MARKDOWN,
 				Result: v1alpha1.AssertResult_FAILED,
 			},
 		},
@@ -91,7 +91,7 @@ func TestAssertOneCodeCell(t *testing.T) {
 			examples: []*v1alpha1.Example{},
 			answer:   []*v1alpha1.Block{},
 			expected: &v1alpha1.Assertion{
-				Name:   "AssertCodeAfterMarkdown",
+				Name:   v1alpha1.Assertion_ONE_CODE_CELL,
 				Result: v1alpha1.AssertResult_SKIPPED,
 			},
 		},
@@ -111,7 +111,7 @@ func TestAssertOneCodeCell(t *testing.T) {
 				},
 			},
 			expected: &v1alpha1.Assertion{
-				Name:   CodeAfterMarkdownName,
+				Name:   v1alpha1.Assertion_ONE_CODE_CELL,
 				Result: v1alpha1.AssertResult_PASSED,
 			},
 		},
@@ -131,7 +131,7 @@ func TestAssertOneCodeCell(t *testing.T) {
 				},
 			},
 			expected: &v1alpha1.Assertion{
-				Name:   OneCodeCellName,
+				Name:   v1alpha1.Assertion_ONE_CODE_CELL,
 				Result: v1alpha1.AssertResult_FAILED,
 			},
 		},
@@ -159,7 +159,7 @@ func TestAssertEndsWithCodeCell(t *testing.T) {
 			examples: []*v1alpha1.Example{},
 			answer:   []*v1alpha1.Block{},
 			expected: &v1alpha1.Assertion{
-				Name:   EndsWithCodeCellName,
+				Name:   v1alpha1.Assertion_ENDS_WITH_CODE_CELL,
 				Result: v1alpha1.AssertResult_SKIPPED,
 			},
 		},
@@ -179,7 +179,7 @@ func TestAssertEndsWithCodeCell(t *testing.T) {
 				},
 			},
 			expected: &v1alpha1.Assertion{
-				Name:   EndsWithCodeCellName,
+				Name:   v1alpha1.Assertion_ENDS_WITH_CODE_CELL,
 				Result: v1alpha1.AssertResult_PASSED,
 			},
 		},
@@ -202,7 +202,7 @@ func TestAssertEndsWithCodeCell(t *testing.T) {
 				},
 			},
 			expected: &v1alpha1.Assertion{
-				Name:   EndsWithCodeCellName,
+				Name:   v1alpha1.Assertion_ENDS_WITH_CODE_CELL,
 				Result: v1alpha1.AssertResult_FAILED,
 			},
 		},