Merge pull request #427 from totocaca123/manage_csv_delimiter

totocaca123 · web-flow · commit 1f2d53c4e15b · 2025-03-11T02:38:09.000+01:00
add_csv_delimiter detect
diff --git a/etc/Jenkinsfile b/etc/Jenkinsfile
@@ -9,7 +9,11 @@ pipeline {
 				publishReport name: "Second JSON Report", displayType: "dual", provider: json(pattern: "etc/report-2.json")
 				publishReport name: "XML Report", displayType: "dual", provider: xml(pattern: "etc/*.xml")
 				publishReport name: "YAML Report", displayType: "dual", provider: yaml(pattern: "etc/*.yaml")
+				
 				publishReport name: "CSV Report Test", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report.csv")
+				publishReport name: "CSV Report Test Tabs", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report_tabulation.csv")
+				publishReport name: "CSV Report Test SemiColon", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report_semicolon.csv")
+
 				publishReport name: "CSV Report Test Robustness", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report_robust.csv")
 			} 
 		}
diff --git a/etc/report_semicolon.csv b/etc/report_semicolon.csv
@@ -0,0 +1,7 @@
+Level 1;Level 2;Level 3;incorrect;manually;accurate
+Aktie;Aktie 1;Aktie 1 1;13;3;59
+Aktie;Aktie 1;Aktie 1 2;31;48;9
+Aktie;Aktie 1;Aktie 1 3;34;8;51 
+Derivat;Derivat 1;;1;2;3
+Derivat;Derivat 2;;5;9;1
+Not Found;;;1;3;9
diff --git a/etc/report_tabulation.csv b/etc/report_tabulation.csv
@@ -0,0 +1,7 @@
+Level 1	Level 2	Level 3	incorrect	manually	accurate
+Aktie	Aktie 1	Aktie 1 1	13	3	59
+Aktie	Aktie 1	Aktie 1 2	31	48	9
+Aktie	Aktie 1	Aktie 1 3	34	8	51 
+Derivat	Derivat 1		1	2	3
+Derivat	Derivat 2		5	9	1
+Not Found			1	3	9
diff --git a/src/main/java/io/jenkins/plugins/reporter/provider/Csv.java b/src/main/java/io/jenkins/plugins/reporter/provider/Csv.java
@@ -17,27 +17,31 @@
 import org.kohsuke.stapler.DataBoundConstructor;
 
 import java.io.File;
+import java.io.BufferedReader;
 import java.io.IOException;
 import java.util.*;
+import java.io.FileInputStream;
+import java.io.InputStreamReader;
+import java.nio.charset.StandardCharsets;
 
 public class Csv extends Provider {
-    
+
     private static final long serialVersionUID = 9141170397250309265L;
 
     private static final String ID = "csv";
-    
+
     @DataBoundConstructor
     public Csv() {
         super();
         // empty constructor required for stapler
     }
-    
+
     @Override
     public ReportParser createParser() {
         if (getActualId().equals(getDescriptor().getId())) {
             throw new IllegalArgumentException(Messages.Provider_Error());
         }
-        
+
         return new CsvCustomParser(getActualId());
     }
 
@@ -54,9 +58,9 @@ public Descriptor() {
     public static class CsvCustomParser extends ReportParser {
 
         private static final long serialVersionUID = -8689695008930386640L;
-        
+
         private final String id;
-        
+
         private List<String> parserMessages;
 
         public CsvCustomParser(String id) {
@@ -69,17 +73,54 @@ public String getId() {
             return id;
         }
 
+        
+        /**
+         * Guesses the column separator by counting candidate characters in the first lines of a file.
+         *
+         * @param file the CSV file to inspect
+         * @return the most frequent candidate; ties go to the earlier candidate, ',' if none occurs
+         * @throws IOException if the file cannot be opened or read
+         */
+        private char detectDelimiter(File file) throws IOException {
+            char[] delimiters = { ',', ';', '\t', '|' };
+            int[] delimiterCounts = new int[delimiters.length];
+            int linesToCheck = 5; // only the head of the file is sampled
+            try (BufferedReader reader = new BufferedReader(new InputStreamReader(new FileInputStream(file), StandardCharsets.UTF_8))) {
+                String line;
+                for (int linesChecked = 0; linesChecked < linesToCheck && (line = reader.readLine()) != null; linesChecked++) {
+                    for (int i = 0; i < delimiters.length; i++) {
+                        delimiterCounts[i] += StringUtils.countMatches(line, delimiters[i]);
+                    }
+                }
+            }
+            // Default to ',' so that a file containing no candidate at all (empty or
+            // single-column) never yields the NUL character as column separator.
+            int maxCount = 0;
+            char detectedDelimiter = ',';
+            for (int i = 0; i < delimiters.length; i++) {
+                if (delimiterCounts[i] > maxCount) {
+                    maxCount = delimiterCounts[i];
+                    detectedDelimiter = delimiters[i];
+                }
+            }
+            return detectedDelimiter;
+        }
+        
+
         @Override
         public ReportDto parse(File file) throws IOException {
+            // Get delimiter
+            char delimiter = detectDelimiter(file);
 
             final CsvMapper mapper = new CsvMapper();
-            final CsvSchema schema = mapper.schemaFor(String[].class).withColumnSeparator(',');
+            final CsvSchema schema = mapper.schemaFor(String[].class).withColumnSeparator(delimiter);
 
             mapper.enable(CsvParser.Feature.WRAP_AS_ARRAY);
             mapper.enable(CsvParser.Feature.SKIP_EMPTY_LINES);
             mapper.enable(CsvParser.Feature.ALLOW_TRAILING_COMMA);
             mapper.enable(CsvParser.Feature.INSERT_NULLS_FOR_MISSING_COLUMNS);
             mapper.enable(CsvParser.Feature.TRIM_SPACES);
+
             final MappingIterator<List<String>> it = mapper.readerForListOf(String.class)
                     .with(schema)
                     .readValues(file);
@@ -100,6 +141,7 @@ public ReportDto parse(File file) throws IOException {
             } else {
                 parserMessages.add(String.format("skipped file - First line has %d elements", headerColumnCount + 1));
             }
+
             /** Parse all data rows */
             for (int rowIdx = 0; rowIdx < rowCount; rowIdx++) {
                 String parentId = "report";
@@ -116,20 +158,22 @@ public ReportDto parse(File file) throws IOException {
                     for (int colIdx = rowSize - 1; colIdx > 1; colIdx--) {
                         String value = row.get(colIdx);
 
-                        if (NumberUtils.isCreatable(value) == true) {
+                        if (NumberUtils.isCreatable(value)) {
                             colIdxValueStart = colIdx;
                         } else {
                             if (colIdxValueStart > 0) {
-                                parserMessages.add(String.format("Found data - fields number = %d  - numeric fields = %d", colIdxValueStart, rowSize - colIdxValueStart));
+                                parserMessages
+                                        .add(String.format("Found data - fields number = %d  - numeric fields = %d",
+                                                colIdxValueStart, rowSize - colIdxValueStart));
                             }
                             break;
                         }
                     }
                 }
 
-                String  valueId = "";
+                String valueId = "";
                 /** Parse line if first data line is OK and line has more element than header */
-                if ((colIdxValueStart > 0) && (rowSize >= headerColumnCount)){
+                if ((colIdxValueStart > 0) && (rowSize >= headerColumnCount)) {
                     /** Check line and header size matching */
                     for (int colIdx = 0; colIdx < headerColumnCount; colIdx++) {
                         String id = header.get(colIdx);
@@ -141,19 +185,22 @@ public ReportDto parse(File file) throws IOException {
                             if ((NumberUtils.isCreatable(value)) || (StringUtils.isBlank(value))) {
                                 /** Empty field found - message */
                                 if (colIdx == 0) {
-                                    parserMessages.add(String.format("skipped line %d - First column item empty - col = %d ", rowIdx + 2, colIdx + 1));
-                                    break ;
+                                    parserMessages
+                                            .add(String.format("skipped line %d - First column item empty - col = %d ",
+                                                    rowIdx + 2, colIdx + 1));
+                                    break;
                                 } else {
                                     emptyFieldFound = true;
                                     /** Continue next column parsing */
                                     continue;
                                 }
                             } else {
                                 /** Check if field values are present after empty cells */
-                                 if (emptyFieldFound == true) {
-                                     parserMessages.add(String.format("skipped line %d Empty field in col = %d ", rowIdx + 2, colIdx + 1));
-                                     break;
-                                 }
+                                if (emptyFieldFound) {
+                                    parserMessages.add(String.format("skipped line %d Empty field in col = %d ",
+                                            rowIdx + 2, colIdx + 1));
+                                    break;
+                                }
                             }
                             valueId += value;
                             Optional<Item> parent = report.findItem(parentId, report.getItems());
@@ -193,19 +240,20 @@ public ReportDto parse(File file) throws IOException {
                         parserMessages.add(String.format("skipped line %d - First data row not found", rowIdx + 2));
                         continue;
                     } else {
-                        parserMessages.add(String.format("skipped line %d - line has fewer element than title", rowIdx + 2));
+                        parserMessages
+                                .add(String.format("skipped line %d - line has fewer element than title", rowIdx + 2));
                         continue;
                     }
                 }
                 /** If last item was created, it will be added to report */
-                if (lastItemAdded == true) {
+                if (lastItemAdded) {
                     last.setResult(result);
                 } else {
                     parserMessages.add(String.format("ignored line %d - Same fields already exists", rowIdx + 2));
                 }
             }
-            //report.setParserLog(parserMessages);
+            // report.setParserLog(parserMessages);
             return report;
         }
     }
-}
+}

Original file line number	Diff line number	Diff line change
`@@ -9,7 +9,11 @@ pipeline {`
`9`	`9`	`publishReport name: "Second JSON Report", displayType: "dual", provider: json(pattern: "etc/report-2.json")`
`10`	`10`	`publishReport name: "XML Report", displayType: "dual", provider: xml(pattern: "etc/*.xml")`
`11`	`11`	`publishReport name: "YAML Report", displayType: "dual", provider: yaml(pattern: "etc/*.yaml")`
	`12`	`+`
`12`	`13`	`publishReport name: "CSV Report Test", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report.csv")`
	`14`	`+ publishReport name: "CSV Report Test Tabs", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report_tabulation.csv")`
	`15`	`+ publishReport name: "CSV Report Test SemiColon", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report_semicolon.csv")`
	`16`	`+`
`13`	`17`	`publishReport name: "CSV Report Test Robustness", displayType: "dual", provider: csv(id: "csv-one", pattern: "etc/report_robust.csv")`
`14`	`18`	`}`
`15`	`19`	`}`