Skip to content

Commit

Permalink
Store the task identifier and the repository name when reading the evaluation CSV file, since they are part of an evaluation record
Browse files Browse the repository at this point in the history

Part of #237
  • Loading branch information
ruiAzevedo19 committed Jul 9, 2024
1 parent ca25797 commit 496418c
Show file tree
Hide file tree
Showing 2 changed files with 30 additions and 13 deletions.
11 changes: 11 additions & 0 deletions evaluate/report/csv.go
Original file line number Diff line number Diff line change
Expand Up @@ -85,6 +85,11 @@ type EvaluationRecord struct {
// LanguageID holds the language id.
LanguageID string

// RepositoryName holds the name of a repository.
RepositoryName string
// Task holds the task identifier.
Task string

// Assessments holds the assessments of an entry.
Assessments metrics.Assessments
}
Expand Down Expand Up @@ -225,6 +230,9 @@ func convertRawRecordToEvaluationRecord(raw []string) (record *EvaluationRecord,

languageID := raw[3]

repositoryName := raw[4]
task := raw[5]

rawMetrics := raw[7:]
for i, assessementKey := range metrics.AllAssessmentKeysStrings {
metric, err := strconv.ParseUint(rawMetrics[i], 10, 64)
Expand All @@ -242,6 +250,9 @@ func convertRawRecordToEvaluationRecord(raw []string) (record *EvaluationRecord,

LanguageID: languageID,

RepositoryName: repositoryName,
Task: task,

Assessments: assessments,
}, nil
}
Expand Down
32 changes: 19 additions & 13 deletions evaluate/report/csv_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -257,10 +257,12 @@ func TestLoadEvaluationRecords(t *testing.T) {

ExpectedEvaluationRecords: EvaluationRecords{
&EvaluationRecord{
ModelID: "openrouter/anthropic/claude-1.2",
ModelName: "Claude 1.2",
ModelCost: 0.0001,
LanguageID: "golang",
ModelID: "openrouter/anthropic/claude-1.2",
ModelName: "Claude 1.2",
ModelCost: 0.0001,
LanguageID: "golang",
RepositoryName: "golang/light",
Task: "write-tests",
Assessments: metrics.Assessments{
metrics.AssessmentKeyCoverage: 750,
metrics.AssessmentKeyFilesExecuted: 18,
Expand All @@ -281,17 +283,19 @@ func TestLoadEvaluationRecords(t *testing.T) {
fileContent := bytesutil.StringTrimIndentations(`
model-id,model-name,cost,language,repository,task,score,coverage,files-executed,generate-tests-for-file-character-count,processing-time,response-character-count,response-no-error,response-no-excess,response-with-code
openrouter/anthropic/claude-1.2,Claude 1.2,0.0001,golang,golang/light,write-tests,982,750,18,70179,720571,71195,115,49,50
openrouter/anthropic/claude-1.2,Claude 1.2,0.0002,golang,golang/plain,write-tests,37,20,2,441,11042,523,5,5,5
openrouter/anthropic/claude-1.2,Claude 1.2,0.0002,golang,golang/plain,transpile,37,20,2,441,11042,523,5,5,5
`)
require.NoError(t, os.WriteFile(filepath.Join(resultPath, "evaluation.csv"), []byte(fileContent), 0644))
},

ExpectedEvaluationRecords: EvaluationRecords{
&EvaluationRecord{
ModelID: "openrouter/anthropic/claude-1.2",
ModelName: "Claude 1.2",
ModelCost: 0.0001,
LanguageID: "golang",
ModelID: "openrouter/anthropic/claude-1.2",
ModelName: "Claude 1.2",
ModelCost: 0.0001,
LanguageID: "golang",
RepositoryName: "golang/light",
Task: "write-tests",
Assessments: metrics.Assessments{
metrics.AssessmentKeyCoverage: 750,
metrics.AssessmentKeyFilesExecuted: 18,
Expand All @@ -304,10 +308,12 @@ func TestLoadEvaluationRecords(t *testing.T) {
},
},
&EvaluationRecord{
ModelID: "openrouter/anthropic/claude-1.2",
ModelName: "Claude 1.2",
ModelCost: 0.0002,
LanguageID: "golang",
ModelID: "openrouter/anthropic/claude-1.2",
ModelName: "Claude 1.2",
ModelCost: 0.0002,
LanguageID: "golang",
RepositoryName: "golang/plain",
Task: "transpile",
Assessments: metrics.Assessments{
metrics.AssessmentKeyCoverage: 20,
metrics.AssessmentKeyFilesExecuted: 2,
Expand Down

0 comments on commit 496418c

Please sign in to comment.