|
| 1 | +package com.evolvedbinary.bblValidator.service; |
| 2 | + |
| 3 | +import com.evolvedbinary.bblValidator.dto.ValidationError; |
| 4 | +import jakarta.inject.Inject; |
| 5 | +import jakarta.inject.Singleton; |
| 6 | +import org.slf4j.Logger; |
| 7 | +import org.slf4j.LoggerFactory; |
| 8 | +import uk.gov.nationalarchives.csv.validator.api.java.*; |
| 9 | + |
| 10 | +import java.nio.charset.Charset; |
| 11 | +import java.nio.file.Path; |
| 12 | +import java.util.ArrayList; |
| 13 | +import java.util.List; |
| 14 | + |
| 15 | +import static uk.gov.nationalarchives.csv.validator.api.CsvValidator$.MODULE$; |
| 16 | + |
| 17 | + |
| 18 | +@Singleton |
| 19 | +public class CsvValidationService { |
| 20 | + |
| 21 | + private static final Logger LOG = LoggerFactory.getLogger(CsvValidationService.class); |
| 22 | + private static final int DEFAULT_MAX_CHARS_PER_CELL = 8096; |
| 23 | + |
| 24 | + @Inject |
| 25 | + private SchemaService schemaService; |
| 26 | + |
| 27 | + public ValidationResult validateCsvFile(Path csvFilePath, String schemaId) { |
| 28 | + long startTime = System.currentTimeMillis(); |
| 29 | + try { |
| 30 | + String schemaFilePath = String.valueOf(schemaService.getSchemaFilePath(schemaId)); |
| 31 | + Charset csvEncoding = MODULE$.DEFAULT_ENCODING(); |
| 32 | + boolean validateUtf8Encoding = csvEncoding.name().equals("UTF-8"); |
| 33 | + Charset csvSchemaEncoding = MODULE$.DEFAULT_ENCODING(); |
| 34 | + boolean failFast = false; |
| 35 | + List<Substitution> pathSubstitutions = new ArrayList<>(); |
| 36 | + boolean enforceCaseSensitivePathChecks = false; |
| 37 | + boolean trace = false; |
| 38 | + boolean skipFileChecks = false; |
| 39 | + |
| 40 | + CsvValidatorJavaBridge.ValidationRequest validationRequest = new CsvValidatorJavaBridge.ValidationRequest( |
| 41 | + csvFilePath.toString(), csvEncoding, validateUtf8Encoding, schemaFilePath, |
| 42 | + csvSchemaEncoding, true, failFast, pathSubstitutions, |
| 43 | + enforceCaseSensitivePathChecks, trace, null, skipFileChecks, DEFAULT_MAX_CHARS_PER_CELL); |
| 44 | + |
| 45 | + CsvValidatorJavaBridge.ValidationResult result = CsvValidatorJavaBridge.validate(validationRequest); |
| 46 | + List<FailMessage> errors = result.errors(); |
| 47 | + long executionTime = System.currentTimeMillis() - startTime; |
| 48 | + return processValidationMessages(errors, executionTime); |
| 49 | + |
| 50 | + } catch (Exception e) { |
| 51 | + long executionTime = System.currentTimeMillis() - startTime; |
| 52 | + LOG.error("Error validating CSV file: {}", csvFilePath, e); |
| 53 | + return ValidationResult.error("Validation failed: " + e.getMessage(), executionTime); |
| 54 | + } |
| 55 | + } |
| 56 | + |
| 57 | + |
| 58 | + private ValidationResult processValidationMessages(List<FailMessage> messages, long executionTimeMs) { |
| 59 | + if (messages.isEmpty()) { |
| 60 | + LOG.info("CSV validation successful - no errors ({}ms)", executionTimeMs); |
| 61 | + return ValidationResult.success(executionTimeMs); |
| 62 | + } |
| 63 | + |
| 64 | + List<ValidationError> errors = new ArrayList<>(); |
| 65 | + |
| 66 | + for (FailMessage message : messages) { |
| 67 | + ValidationError error = new ValidationError( |
| 68 | + message.getMessage(), |
| 69 | + message.getLineNumber(), |
| 70 | + message.getColumnIndex() + 1 // Add 1 for user display |
| 71 | + ); |
| 72 | + errors.add(error); |
| 73 | + LOG.info("Validation error at line {}, column {}: {}", |
| 74 | + message.getLineNumber(), message.getColumnIndex(), message.getMessage()); |
| 75 | + } |
| 76 | + |
| 77 | + LOG.info("CSV validation completed - Valid: false, Errors: {} ({}ms)", errors.size(), executionTimeMs); |
| 78 | + return new ValidationResult(false, errors, executionTimeMs); |
| 79 | + } |
| 80 | + |
| 81 | + |
| 82 | + public static class ValidationResult { |
| 83 | + private final boolean valid; |
| 84 | + private final List<ValidationError> errors; |
| 85 | + private final String errorMessage; |
| 86 | + private final long executionTimeMs; |
| 87 | + |
| 88 | + public ValidationResult(boolean valid, List<ValidationError> errors, long executionTimeMs) { |
| 89 | + this.valid = valid; |
| 90 | + this.errors = errors; |
| 91 | + this.errorMessage = null; |
| 92 | + this.executionTimeMs = executionTimeMs; |
| 93 | + } |
| 94 | + |
| 95 | + private ValidationResult(String errorMessage, long executionTimeMs) { |
| 96 | + this.valid = false; |
| 97 | + this.errors = new ArrayList<>(); |
| 98 | + this.errorMessage = errorMessage; |
| 99 | + this.executionTimeMs = executionTimeMs; |
| 100 | + } |
| 101 | + |
| 102 | + public static ValidationResult success(long executionTimeMs) { |
| 103 | + return new ValidationResult(true, new ArrayList<>(), executionTimeMs); |
| 104 | + } |
| 105 | + |
| 106 | + public static ValidationResult error(String errorMessage, long executionTimeMs) { |
| 107 | + return new ValidationResult(errorMessage, executionTimeMs); |
| 108 | + } |
| 109 | + |
| 110 | + public boolean isValid() { |
| 111 | + return valid; |
| 112 | + } |
| 113 | + |
| 114 | + public List<ValidationError> getErrors() { |
| 115 | + return errors; |
| 116 | + } |
| 117 | + |
| 118 | + public String getErrorMessage() { |
| 119 | + return errorMessage; |
| 120 | + } |
| 121 | + |
| 122 | + public boolean hasErrorMessage() { |
| 123 | + return errorMessage != null; |
| 124 | + } |
| 125 | + |
| 126 | + public long getExecutionTimeMs() { |
| 127 | + return executionTimeMs; |
| 128 | + } |
| 129 | + } |
| 130 | +} |
0 commit comments