fix(evaluate): establish threshold for assessment results result (#457)
* feat(validate): establish threshold for assessment results result

* feat(evaluate): support for single artifact props update

* fix(evaluate): perform evaluation with parity for multiple files

* fix(evaluate): separate write logic from core evaluation logic

* fix(evaluate): refactor code to library and move/fix tests

* fix(evaluate): add tests and cleanup various functions

* fix(evaluate): cleanup testing files

* fix(evaluate): WIP for tests and updated logic

* fix(evaluate): updated logic and testing for edge case

* fix(evaluate): additional testing after merge - updating merge logic

* fix(oscal): updated merge logic for assessment results

* fix(evaluate): cleanup, update props, testing

---------

Co-authored-by: Cole (Mike) Winberry <[email protected]>
Co-authored-by: Megan Wolf <[email protected]>
3 people authored Jun 13, 2024
1 parent 679d2c8 commit 4571cb8
Showing 7 changed files with 722 additions and 327 deletions.
docs/evaluate.md: 40 additions, 0 deletions (new file)

# Compliance Evaluation

Evaluate verifies the compliance of a component/system against an established threshold, determining whether the system is more or less compliant than it was in a previous assessment.

## Expected Process

### No Existing Data

When no previous assessment exists, the initial assessment is made and stored with `lula validate`. This initial assessment will always pass `lula evaluate`, as there is no threshold to evaluate against. Lula automatically applies the `threshold` prop to the assessment result when writing it to a file that does not already contain an assessment results artifact, as sketched after the steps below.

Steps:
1. `lula validate`
2. `lula evaluate` -> Passes (no threshold exists yet)
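
A minimal sketch of the result Lula might write in this case. The structure follows the threshold prop shown later in this document; the UUID is hypothetical and all other result fields are omitted:
```yaml
results:
  - uuid: 2d72c784-ffcb-40a4-bb29-2c3936539ab5 # hypothetical UUID
    # ...other result fields omitted...
    props:
      - name: threshold
        ns: https://docs.lula.dev/ns
        value: "true" # the first result written to a new file defaults to the threshold
```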

### Existing Data (Intended Workflow)

In workflows run manually or with automation (such as CI/CD), the threshold is expected to exist, and evaluate analyzes the compliance of the system/component against that established threshold; see the CI sketch after the steps below.

Steps:
1. `lula validate`
2. `lula evaluate` -> Passes or fails based on the threshold
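
As a rough sketch of the automated case, a CI job could run both commands and let a failed evaluation fail the pipeline. Only the two `lula` commands come from this document; the job layout, checkout step, and file name are hypothetical GitHub Actions-style assumptions:
```yaml
jobs:
  compliance:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4
      # Produce a fresh assessment result
      - run: lula validate
      # Compare the latest result against the established threshold;
      # a failed evaluation is fatal and fails the job
      - run: lula evaluate -f assessment-results.yaml
```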


## Scenarios for Consideration

Evaluate will determine which result is the threshold based on the following property:
```yaml
props:
- name: threshold
ns: https://docs.lula.dev/ns
value: "true/false"
```
### Assessment Results Artifact
When evaluate is run with a single assessment results artifact, a single threshold result with a `true` value is expected. That result is identified and evaluated against the latest result to determine whether compliance is lower than the threshold (fail), equal (pass), or greater (pass). When the comparison shows greater compliance, Lula will update the threshold `prop` for the latest result to `true` and set the previous result's threshold prop to `false`, as sketched below.
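
A sketch of the props after such an evaluation, assuming hypothetical UUIDs and omitting all other result fields:
```yaml
results:
  - uuid: c9f2b1d4-6a3e-4f8b-9c1d-2e5a7b8c9d0e # latest result, promoted to threshold
    props:
      - name: threshold
        ns: https://docs.lula.dev/ns
        value: "true"
  - uuid: 5b8e2f1a-3c4d-4e5f-8a9b-0c1d2e3f4a5b # previous threshold, demoted
    props:
      - name: threshold
        ns: https://docs.lula.dev/ns
        value: "false"
```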

### Comparing multiple assessment results artifacts

In the scenario where multiple assessment results artifacts are evaluated, there may be multiple threshold results with a `true` value, since Lula establishes a default `true` value when writing an assessment results artifact to a new file with no previous results present. In this case, Lula will use the older result as the threshold when determining the compliance of the latest result, as in the sketch below.
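
For example, two independently produced files can each contain a result marked as the threshold. In this hypothetical sketch (fake UUIDs and timestamps), the result in the older file would be treated as the threshold:
```yaml
# assessment-results-old.yaml - older run, used as the threshold
results:
  - uuid: 1a2b3c4d-5e6f-4a7b-8c9d-0e1f2a3b4c5d # hypothetical
    start: "2024-06-01T00:00:00Z"
    props:
      - name: threshold
        ns: https://docs.lula.dev/ns
        value: "true"
---
# assessment-results-new.yaml - newer run, evaluated against the threshold
results:
  - uuid: 6f7a8b9c-0d1e-4f2a-b3c4-d5e6f7a8b9c0 # hypothetical
    start: "2024-06-10T00:00:00Z"
    props:
      - name: threshold
        ns: https://docs.lula.dev/ns
        value: "true"
```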
src/cmd/evaluate/evaluate.go: 84 additions, 109 deletions

```diff
@@ -15,7 +15,7 @@ var evaluateHelp = `
 To evaluate the latest results in two assessment results files:
 	lula evaluate -f assessment-results-threshold.yaml -f assessment-results-new.yaml
-To evaluate two results (latest and preceding) in a single assessment results file:
+To evaluate two results (threshold and latest) in a single OSCAL file:
 	lula evaluate -f assessment-results.yaml
 `
```

```diff
@@ -33,11 +33,13 @@ var evaluateCmd = &cobra.Command{
 	Aliases: []string{"eval"},
 	Run: func(cmd *cobra.Command, args []string) {
 
-		// Access the files and evaluate them
-		err := EvaluateAssessmentResults(opts.files)
+		// Build map of filepath -> assessment results
+		assessmentMap, err := readManyAssessmentResults(opts.files)
 		if err != nil {
 			message.Fatal(err, err.Error())
 		}
+
+		EvaluateAssessments(assessmentMap)
 	},
 }
```

```diff
@@ -48,132 +50,105 @@ func EvaluateCommand() *cobra.Command {
 	return evaluateCmd
 }
 
-func EvaluateAssessmentResults(fileArray []string) error {
-	var status bool
-	var findings map[string][]oscalTypes_1_1_2.Finding
-
-	// Read in files - establish the results to
-	if len(fileArray) == 0 {
-		// TODO: Determine if we will handle a default location/name for assessment files
-		return fmt.Errorf("No files provided for evaluation")
-	}
-
-	for _, f := range fileArray {
-		err := files.IsJsonOrYaml(f)
-		if err != nil {
-			return fmt.Errorf("invalid file extension: %s, requires .json or .yaml", f)
-		}
-	}
-
-	if len(fileArray) == 1 {
-		data, err := common.ReadFileToBytes(fileArray[0])
-		if err != nil {
-			return err
-		}
-		assessment, err := oscal.NewAssessmentResults(data)
-		if err != nil {
-			return err
-		}
-		if len(assessment.Results) < 2 {
-			return fmt.Errorf("2 or more result objects must be present for evaluation\n")
-		}
-		// We write results to the assessment-results report in newest -> oldest
-		// Older being our threshold here
-		status, findings, err = EvaluateResults(&assessment.Results[1], &assessment.Results[0])
-		if err != nil {
-			return err
-		}
-	} else if len(fileArray) == 2 {
-		data, err := common.ReadFileToBytes(fileArray[0])
-		if err != nil {
-			return err
-		}
-		assessmentOne, err := oscal.NewAssessmentResults(data)
-		if err != nil {
-			return err
-		}
-		data, err = common.ReadFileToBytes(fileArray[1])
-		if err != nil {
-			return err
-		}
-		assessmentTwo, err := oscal.NewAssessmentResults(data)
-		if err != nil {
-			return err
-		}
-
-		// Consider parsing the timestamps for comparison
-		// Older timestamp being the threshold
-
-		status, findings, err = EvaluateResults(&assessmentOne.Results[0], &assessmentTwo.Results[0])
-		if err != nil {
-			return err
-		}
-	} else {
-		return fmt.Errorf("Exceeded maximum of 2 files for evaluation\n")
-	}
-
-	if status {
-		message.Info("Evaluation Passing the established threshold")
-		if len(findings["new-findings"]) > 0 {
-			message.Info("New finding Target-Ids:")
-			for _, finding := range findings["new-findings"] {
-				message.Infof("%s", finding.Target.TargetId)
-			}
-		}
-	} else {
-		message.Warn("Evaluation Failed against the following findings:")
-		for _, finding := range findings["no-longer-satisfied"] {
-			message.Warnf("%s", finding.Target.TargetId)
-		}
-		return fmt.Errorf("Failed to meet established threshold")
-	}
-	return nil
-}
-
-func EvaluateResults(thresholdResult *oscalTypes_1_1_2.Result, newResult *oscalTypes_1_1_2.Result) (bool, map[string][]oscalTypes_1_1_2.Finding, error) {
-	if thresholdResult == nil || thresholdResult.Findings == nil || newResult == nil || newResult.Findings == nil {
-		return false, nil, fmt.Errorf("results must contain findings to evaluate")
-	}
-
-	spinner := message.NewProgressSpinner("Evaluating Assessment Results %s against %s", newResult.UUID, thresholdResult.UUID)
-	defer spinner.Stop()
-
-	// Store unique findings for review here
-	findings := make(map[string][]oscalTypes_1_1_2.Finding, 0)
-	result := true
-
-	findingMapThreshold := oscal.GenerateFindingsMap(*thresholdResult.Findings)
-	findingMapNew := oscal.GenerateFindingsMap(*newResult.Findings)
-
-	// For a given oldResult - we need to prove that the newResult implements all of the oldResult findings/controls
-	// We are explicitly iterating through the findings in order to collect a delta to display
-
-	for targetId, finding := range findingMapThreshold {
-		if _, ok := findingMapNew[targetId]; !ok {
-			// If the new result does not contain the finding of the old result
-			// set result to fail, add finding to the findings map and continue
-			result = false
-			findings[targetId] = append(findings["no-longer-satisfied"], finding)
-		} else {
-			// If the finding is present in each map - we need to check if the state has changed from "not-satisfied" to "satisfied"
-			if finding.Target.Status.State == "satisfied" {
-				// Was previously satisfied - compare state
-				if findingMapNew[targetId].Target.Status.State == "not-satisfied" {
-					// If the new finding is now not-satisfied - set result to false and add to findings
-					result = false
-					findings["no-longer-satisfied"] = append(findings["no-longer-satisfied"], finding)
-				}
-			}
-			delete(findingMapNew, targetId)
-		}
-	}
-
-	// All remaining findings in the new map are new findings
-	for _, finding := range findingMapNew {
-		findings["new-findings"] = append(findings["new-findings"], finding)
-	}
-
-	spinner.Success()
-	return result, findings, nil
-}
+func EvaluateAssessments(assessmentMap map[string]*oscalTypes_1_1_2.AssessmentResults) {
+	// Identify the threshold & latest for comparison
+	resultMap, err := oscal.IdentifyResults(assessmentMap)
+	if err != nil {
+		if err.Error() == "less than 2 results found - no comparison possible" {
+			// Catch and warn of insufficient results
+			message.Warn(err.Error())
+			return
+		} else {
+			message.Fatal(err, err.Error())
+		}
+	}
+
+	if resultMap["threshold"] != nil && resultMap["latest"] != nil {
+		// Compare the assessment results
+		spinner := message.NewProgressSpinner("Evaluating Assessment Results %s against %s", resultMap["threshold"].UUID, resultMap["latest"].UUID)
+		defer spinner.Stop()
+
+		status, findings, err := oscal.EvaluateResults(resultMap["threshold"], resultMap["latest"])
+		if err != nil {
+			message.Fatal(err, err.Error())
+		}
+
+		if status {
+			if len(findings["new-passing-findings"]) > 0 {
+				message.Info("New passing finding Target-Ids:")
+				for _, finding := range findings["new-passing-findings"] {
+					message.Infof("%s", finding.Target.TargetId)
+				}
+
+				message.Infof("New threshold identified - threshold will be updated to result %s", resultMap["latest"].UUID)
+
+				// Update latest threshold prop
+				oscal.UpdateProps("threshold", "https://docs.lula.dev/ns", "true", resultMap["latest"].Props)
+			} else {
+				// retain result as threshold
+				oscal.UpdateProps("threshold", "https://docs.lula.dev/ns", "true", resultMap["threshold"].Props)
+			}
+
+			if len(findings["new-failing-findings"]) > 0 {
+				message.Info("New failing finding Target-Ids:")
+				for _, finding := range findings["new-failing-findings"] {
+					message.Infof("%s", finding.Target.TargetId)
+				}
+			}
+		} else {
+			message.Warn("Evaluation Failed against the following findings:")
+			for _, finding := range findings["no-longer-satisfied"] {
+				message.Warnf("%s", finding.Target.TargetId)
+			}
+			message.Fatalf(fmt.Errorf("failed to meet established threshold"), "failed to meet established threshold")
+
+			// retain result as threshold
+			oscal.UpdateProps("threshold", "https://docs.lula.dev/ns", "true", resultMap["threshold"].Props)
+		}
+
+		spinner.Success()
+
+	} else if resultMap["threshold"] == nil {
+		message.Fatal(fmt.Errorf("no threshold assessment results could be identified"), "no threshold assessment results could be identified")
+	} else {
+		message.Fatal(fmt.Errorf("no latest assessment results could be identified"), "no latest assessment results could be identified")
+	}
+
+	// Write each file back in the case of modification
+	for filePath, assessment := range assessmentMap {
+		model := oscalTypes_1_1_2.OscalCompleteSchema{
+			AssessmentResults: assessment,
+		}
+
+		oscal.WriteOscalModel(filePath, &model)
+	}
+}
+
+// Read many filepaths into a map[filepath]*AssessmentResults
+// Placing here until otherwise decided on value elsewhere
+func readManyAssessmentResults(fileArray []string) (map[string]*oscalTypes_1_1_2.AssessmentResults, error) {
+	if len(fileArray) == 0 {
+		return nil, fmt.Errorf("no files provided for evaluation")
+	}
+
+	assessmentMap := make(map[string]*oscalTypes_1_1_2.AssessmentResults)
+	for _, fileString := range fileArray {
+		err := files.IsJsonOrYaml(fileString)
+		if err != nil {
+			return nil, fmt.Errorf("invalid file extension: %s, requires .json or .yaml", fileString)
+		}
+
+		data, err := common.ReadFileToBytes(fileString)
+		if err != nil {
+			return nil, err
+		}
+		assessment, err := oscal.NewAssessmentResults(data)
+		if err != nil {
+			return nil, err
+		}
+		assessmentMap[fileString] = assessment
+	}
+	return assessmentMap, nil
+}
```