Let the "write-tests" prompt ask the model to extend the given source file when the tests belong in the source file itself

Andreas Humenberger · Andreas Humenberger · commit e6f868201520 · 2025-05-14T10:05:52.000+02:00
diff --git a/evaluate/task/test-integration/task_test.go b/evaluate/task/test-integration/task_test.go
@@ -109,9 +109,9 @@ func TestWriteTestsRun(t *testing.T) {
 
 			Setup: func(t *testing.T) {
 				var query any = bytesutil.StringTrimIndentations(`
-					Given the following Rust code file "src/plain.rs", provide tests for this code.
+					Given the following Rust code file "src/plain.rs", extend the code to include tests.
 					The tests should produce 100 percent code coverage and must compile.
-					The response must contain only the test code in a fenced code block and nothing else.
+					The response must contain the original source code and the tests in a fenced code block and nothing else.
 
 					` + "```" + `rust
 					pub fn plain() {
@@ -127,6 +127,10 @@ func TestWriteTestsRun(t *testing.T) {
 					&provider.QueryResult{
 						Message: bytesutil.StringTrimIndentations(`
 							` + "```rust`" + `
+							pub fn plain() {
+								// This does not do anything but it gives us a line to cover.
+							}
+
 							#[cfg(test)]
 							mod tests {
 								use super::*;
@@ -151,8 +155,8 @@ func TestWriteTestsRun(t *testing.T) {
 			ExpectedRepositoryAssessment: map[string]map[evaltask.Identifier]metrics.Assessments{
 				filepath.Join("src", "plain.rs"): {
 					evaluatetask.IdentifierWriteTests: metrics.Assessments{
-						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 84,
-						metrics.AssessmentKeyResponseCharacterCount:             98,
+						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 167,
+						metrics.AssessmentKeyResponseCharacterCount:             181,
 						metrics.AssessmentKeyCoverage:                           3,
 						metrics.AssessmentKeyFilesExecuted:                      1,
 						metrics.AssessmentKeyFilesExecutedMaximumReachable:      1,
@@ -161,8 +165,8 @@ func TestWriteTestsRun(t *testing.T) {
 						metrics.AssessmentKeyResponseWithCode:                   1,
 					},
 					evaluatetask.IdentifierWriteTestsSymflowerFix: metrics.Assessments{
-						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 84,
-						metrics.AssessmentKeyResponseCharacterCount:             98,
+						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 167,
+						metrics.AssessmentKeyResponseCharacterCount:             181,
 						metrics.AssessmentKeyCoverage:                           3,
 						metrics.AssessmentKeyFilesExecuted:                      1,
 						metrics.AssessmentKeyFilesExecutedMaximumReachable:      1,
@@ -171,8 +175,8 @@ func TestWriteTestsRun(t *testing.T) {
 						metrics.AssessmentKeyResponseWithCode:                   1,
 					},
 					evaluatetask.IdentifierWriteTestsSymflowerTemplate: metrics.Assessments{
-						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 84,
-						metrics.AssessmentKeyResponseCharacterCount:             98,
+						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 167,
+						metrics.AssessmentKeyResponseCharacterCount:             181,
 						metrics.AssessmentKeyCoverage:                           3,
 						metrics.AssessmentKeyFilesExecuted:                      1,
 						metrics.AssessmentKeyFilesExecutedMaximumReachable:      1,
@@ -181,8 +185,8 @@ func TestWriteTestsRun(t *testing.T) {
 						metrics.AssessmentKeyResponseWithCode:                   1,
 					},
 					evaluatetask.IdentifierWriteTestsSymflowerTemplateSymflowerFix: metrics.Assessments{
-						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 84,
-						metrics.AssessmentKeyResponseCharacterCount:             98,
+						metrics.AssessmentKeyGenerateTestsForFileCharacterCount: 167,
+						metrics.AssessmentKeyResponseCharacterCount:             181,
 						metrics.AssessmentKeyCoverage:                           3,
 						metrics.AssessmentKeyFilesExecuted:                      1,
 						metrics.AssessmentKeyFilesExecutedMaximumReachable:      1,
diff --git a/model/llm/llm.go b/model/llm/llm.go
@@ -2,7 +2,6 @@ package llm
 
 import (
 	"context"
-	"errors"
 	"os"
 	"path/filepath"
 	"strings"
@@ -148,9 +147,13 @@ type llmWriteTestSourceFilePromptContext struct {
 
 // llmWriteTestForFilePromptTemplate is the template for generating an LLM test generation prompt.
 var llmWriteTestForFilePromptTemplate = template.Must(template.New("model-llm-write-test-for-file-prompt").Parse(bytesutil.StringTrimIndentations(`
-	Given the following {{ .Language.Name }} code file "{{ .FilePath }}" {{- with .ImportPath }} with package "{{ . }}" {{- end }}, provide {{- if .HasTestsInSource }} tests {{ else }} a test file {{ end -}} for this code{{ with .TestFramework }} with {{ . }} as a test framework{{ end }}.
+	Given the following {{ .Language.Name }} code file "{{ .FilePath }}" {{- with .ImportPath }} with package "{{ . }}" {{- end }}, {{- if .HasTestsInSource }} extend the code to include tests{{ else }} provide a test file for this code{{ with .TestFramework }} with {{ . }} as a test framework{{ end }}{{ end -}}.
 	The tests should produce 100 percent code coverage and must compile.
+	{{- if .HasTestsInSource }}
+	The response must contain the original source code and the tests in a fenced code block and nothing else.
+	{{- else }}
 	The response must contain only the test code in a fenced code block and nothing else.
+	{{- end }}
 
 	` + "```" + `{{ .Language.ID }}
 	{{ .Code }}
@@ -337,7 +340,7 @@ func (m *Model) WriteTests(ctx model.Context) (assessment metrics.Assessments, e
 		filePath = filepath.Join(ctx.RepositoryPath, ctx.Language.TestFilePath(ctx.RepositoryPath, ctx.FilePath))
 	}
 
-	return handleQueryResult(queryResult, filePath, ctx.HasTestsInSource)
+	return handleQueryResult(queryResult, filePath)
 }
 
 func (m *Model) query(logger *log.Logger, request string) (queryResult *provider.QueryResult, err error) {
@@ -422,7 +425,7 @@ func (m *Model) RepairCode(ctx model.Context) (assessment metrics.Assessments, e
 		return nil, pkgerrors.WithStack(err)
 	}
 
-	return handleQueryResult(queryResult, filepath.Join(ctx.RepositoryPath, ctx.FilePath), false)
+	return handleQueryResult(queryResult, filepath.Join(ctx.RepositoryPath, ctx.FilePath))
 }
 
 var _ model.CapabilityTranspile = (*Model)(nil)
@@ -469,7 +472,7 @@ func (m *Model) Transpile(ctx model.Context) (assessment metrics.Assessments, er
 		return nil, pkgerrors.WithStack(err)
 	}
 
-	return handleQueryResult(queryResult, filepath.Join(ctx.RepositoryPath, ctx.FilePath), false)
+	return handleQueryResult(queryResult, filepath.Join(ctx.RepositoryPath, ctx.FilePath))
 }
 
 var _ model.CapabilityMigrate = (*Model)(nil)
@@ -509,10 +512,10 @@ func (m *Model) Migrate(ctx model.Context) (assessment metrics.Assessments, err
 		return nil, pkgerrors.WithStack(err)
 	}
 
-	return handleQueryResult(queryResult, filepath.Join(ctx.RepositoryPath, ctx.FilePath), false)
+	return handleQueryResult(queryResult, filepath.Join(ctx.RepositoryPath, ctx.FilePath))
 }
 
-func handleQueryResult(queryResult *provider.QueryResult, filePathAbsolute string, appendFile bool) (assessment metrics.Assessments, err error) {
+func handleQueryResult(queryResult *provider.QueryResult, filePathAbsolute string) (assessment metrics.Assessments, err error) {
 	assessment, sourceFileContent, err := prompt.ParseResponse(queryResult.Message)
 	if err != nil {
 		return nil, pkgerrors.WithStack(err)
@@ -536,22 +539,7 @@ func handleQueryResult(queryResult *provider.QueryResult, filePathAbsolute strin
 		return nil, pkgerrors.WithStack(err)
 	}
 
-	flags := os.O_WRONLY | os.O_CREATE
-	if appendFile {
-		flags = flags | os.O_APPEND
-	} else {
-		flags = flags | os.O_TRUNC
-	}
-	file, err := os.OpenFile(filePathAbsolute, flags, 0644)
-	if err != nil {
-		return nil, pkgerrors.WithStack(err)
-	}
-	defer func() {
-		if closeErr := file.Close(); closeErr != nil {
-			err = errors.Join(err, pkgerrors.WithStack(closeErr))
-		}
-	}()
-	if _, err := file.WriteString(sourceFileContent); err != nil {
+	if err := os.WriteFile(filePathAbsolute, []byte(sourceFileContent), 0644); err != nil {
 		return nil, pkgerrors.WithStack(err)
 	}
 
diff --git a/model/llm/llm_test.go b/model/llm/llm_test.go
@@ -708,9 +708,9 @@ func TestFormatPromptContext(t *testing.T) {
 			},
 
 			ExpectedMessage: bytesutil.StringTrimIndentations(`
-				Given the following Rust code file "path/to/main.rs", provide tests for this code.
+				Given the following Rust code file "path/to/main.rs", extend the code to include tests.
 				The tests should produce 100 percent code coverage and must compile.
-				The response must contain only the test code in a fenced code block and nothing else.
+				The response must contain the original source code and the tests in a fenced code block and nothing else.
 
 				` + "```" + `rust
 				fn main() {