CSVStrategy is now immutable (SANDBOX-279)

ebourg · ebourg · commit 42476f4b08fe · 2011-11-09T16:21:23.000Z
git-svn-id: https://svn.apache.org/repos/asf/commons/sandbox/csv/trunk@1199827 13f79535-47bb-0310-9956-ffa450edef68
diff --git a/src/main/java/org/apache/commons/csv/CSVParser.java b/src/main/java/org/apache/commons/csv/CSVParser.java
@@ -122,7 +122,7 @@ Token reset() {
      * @param input a Reader containing "csv-formatted" input
      */
     public CSVParser(Reader input) {
-        this(input, (CSVStrategy) CSVStrategy.DEFAULT_STRATEGY.clone());
+        this(input, CSVStrategy.DEFAULT_STRATEGY);
     }
 
     /**
@@ -260,7 +260,7 @@ Token nextToken(Token tkn) throws IOException {
         c = in.readAgain();
 
         //  empty line detection: eol AND (last char was EOL or beginning)
-        while (strategy.getIgnoreEmptyLines() && eol
+        while (strategy.isEmptyLinesIgnored() && eol
                 && (lastChar == '\n'
                 || lastChar == '\r'
                 || lastChar == ExtendedBufferedReader.UNDEFINED)
@@ -286,7 +286,7 @@ Token nextToken(Token tkn) throws IOException {
         //  important: make sure a new char gets consumed in each iteration
         while (!tkn.isReady && tkn.type != TT_EOF) {
             // ignore whitespaces at beginning of a token
-            while (strategy.getIgnoreLeadingWhitespaces() && isWhitespace(c) && !eol) {
+            while (strategy.isLeadingSpacesIgnored() && isWhitespace(c) && !eol) {
                 wsBuf.append((char) c);
                 c = in.read();
                 eol = isEndOfLine(c);
@@ -316,7 +316,7 @@ Token nextToken(Token tkn) throws IOException {
             } else {
                 // next token must be a simple token
                 // add removed blanks when not ignoring whitespace chars...
-                if (!strategy.getIgnoreLeadingWhitespaces()) {
+                if (!strategy.isLeadingSpacesIgnored()) {
                     tkn.content.append(wsBuf);
                 }
                 simpleTokenLexer(tkn, c);
@@ -359,7 +359,7 @@ private Token simpleTokenLexer(Token tkn, int c) throws IOException {
                 tkn.type = TT_TOKEN;
                 tkn.isReady = true;
                 break;
-            } else if (c == '\\' && strategy.getUnicodeEscapeInterpretation() && in.lookAhead() == 'u') {
+            } else if (c == '\\' && strategy.isUnicodeEscapesInterpreted() && in.lookAhead() == 'u') {
                 // interpret unicode escaped chars (like \u0070 -> p)
                 tkn.content.append((char) unicodeEscapeLexer(c));
             } else if (c == strategy.getEscape()) {
@@ -371,7 +371,7 @@ private Token simpleTokenLexer(Token tkn, int c) throws IOException {
             c = in.read();
         }
 
-        if (strategy.getIgnoreTrailingWhitespaces()) {
+        if (strategy.isTrailingSpacesIgnored()) {
             tkn.content.trimTrailingWhitespace();
         }
 
@@ -400,7 +400,7 @@ private Token encapsulatedTokenLexer(Token tkn, int c) throws IOException {
         for (; ;) {
             c = in.read();
 
-            if (c == '\\' && strategy.getUnicodeEscapeInterpretation() && in.lookAhead() == 'u') {
+            if (c == '\\' && strategy.isUnicodeEscapesInterpreted() && in.lookAhead() == 'u') {
                 tkn.content.append((char) unicodeEscapeLexer(c));
             } else if (c == strategy.getEscape()) {
                 tkn.content.append((char) readEscape(c));
diff --git a/src/main/java/org/apache/commons/csv/CSVPrinter.java b/src/main/java/org/apache/commons/csv/CSVPrinter.java
@@ -58,7 +58,7 @@ public CSVPrinter(Writer out, CSVStrategy strategy) {
      * Output a blank line
      */
     public void println() throws IOException {
-        out.write(strategy.getPrinterNewline());
+        out.write(strategy.getLineSeparator());
         newLine = true;
     }
 
diff --git a/src/main/java/org/apache/commons/csv/CSVStrategy.java b/src/main/java/org/apache/commons/csv/CSVStrategy.java
@@ -26,17 +26,15 @@
  */
 public class CSVStrategy implements Cloneable, Serializable {
 
-    private char delimiter;
-    private char encapsulator;
-    private char commentStart;
-    private char escape;
-    private boolean ignoreLeadingWhitespaces;
-    private boolean ignoreTrailingWhitespaces;
-    private boolean interpretUnicodeEscapes;
-    private boolean ignoreEmptyLines;
-
-    // controls for output
-    private String printerNewline = "\n";
+    private char delimiter = ',';
+    private char encapsulator = '"';
+    private char commentStart = COMMENTS_DISABLED;
+    private char escape = ESCAPE_DISABLED;
+    private boolean leadingSpacesIgnored = true;
+    private boolean trailingSpacesIgnored = true;
+    private boolean unicodeEscapesInterpreted = false;
+    private boolean emptyLinesIgnored = true;
+    private String lineSeparator = "\n";
 
     // -2 is used to signal disabled, because it won't be confused with
     // an EOF signal (-1), and because \ufffe in UTF-16 would be
@@ -46,11 +44,22 @@ public class CSVStrategy implements Cloneable, Serializable {
     public static final char ESCAPE_DISABLED = (char) -2;
     public static final char ENCAPSULATOR_DISABLED = (char) -2;
 
+    /** Standard comma separated format. */
     public static final CSVStrategy DEFAULT_STRATEGY = new CSVStrategy(',', '"', COMMENTS_DISABLED, ESCAPE_DISABLED, true, true, false, true);
+    
+    /** Excel file format (using a comma as the value delimiter). */
     public static final CSVStrategy EXCEL_STRATEGY = new CSVStrategy(',', '"', COMMENTS_DISABLED, ESCAPE_DISABLED, false, false, false, false);
+    
+    /** Tab-delimited format. */
     public static final CSVStrategy TDF_STRATEGY = new CSVStrategy('\t', '"', COMMENTS_DISABLED, ESCAPE_DISABLED, true, true, false, true);
 
 
+    /**
+     * Creates a CSVStrategy with the default parameters.
+     */
+    public CSVStrategy() {
+    }
+
     public CSVStrategy(char delimiter, char encapsulator, char commentStart) {
         this(delimiter, encapsulator, commentStart, ESCAPE_DISABLED, true, true, false, true);
     }
@@ -62,103 +71,129 @@ public CSVStrategy(char delimiter, char encapsulator, char commentStart) {
      * @param encapsulator              a char used as value encapsulation marker
      * @param commentStart              a char used for comment identification
      * @param escape                    a char used to escape special characters in values
-     * @param ignoreLeadingWhitespaces  TRUE when leading whitespaces should be ignored
-     * @param ignoreTrailingWhitespaces TRUE when trailing whitespaces should be ignored
-     * @param interpretUnicodeEscapes   TRUE when unicode escapes should be interpreted
-     * @param ignoreEmptyLines          TRUE when the parser should skip emtpy lines
+     * @param leadingSpacesIgnored      TRUE when leading whitespaces should be ignored
+     * @param trailingSpacesIgnored     TRUE when trailing whitespaces should be ignored
+     * @param unicodeEscapesInterpreted TRUE when unicode escapes should be interpreted
+     * @param emptyLinesIgnored         TRUE when the parser should skip empty lines
      */
     public CSVStrategy(
             char delimiter,
             char encapsulator,
             char commentStart,
             char escape,
-            boolean ignoreLeadingWhitespaces,
-            boolean ignoreTrailingWhitespaces,
-            boolean interpretUnicodeEscapes,
-            boolean ignoreEmptyLines) {
+            boolean leadingSpacesIgnored,
+            boolean trailingSpacesIgnored,
+            boolean unicodeEscapesInterpreted,
+            boolean emptyLinesIgnored) {
         this.delimiter = delimiter;
         this.encapsulator = encapsulator;
         this.commentStart = commentStart;
         this.escape = escape;
-        this.ignoreLeadingWhitespaces = ignoreLeadingWhitespaces;
-        this.ignoreTrailingWhitespaces = ignoreTrailingWhitespaces;
-        this.interpretUnicodeEscapes = interpretUnicodeEscapes;
-        this.ignoreEmptyLines = ignoreEmptyLines;
-    }
-
-    public void setDelimiter(char delimiter) {
-        this.delimiter = delimiter;
+        this.leadingSpacesIgnored = leadingSpacesIgnored;
+        this.trailingSpacesIgnored = trailingSpacesIgnored;
+        this.unicodeEscapesInterpreted = unicodeEscapesInterpreted;
+        this.emptyLinesIgnored = emptyLinesIgnored;
     }
 
     public char getDelimiter() {
-        return this.delimiter;
+        return delimiter;
     }
 
-    public void setEncapsulator(char encapsulator) {
-        this.encapsulator = encapsulator;
+    public CSVStrategy withDelimiter(char delimiter) {
+        CSVStrategy strategy = (CSVStrategy) clone(); // work on a copy so this instance is never modified
+        strategy.delimiter = delimiter;               // set on the copy; assigning to 'this' mutated the receiver and returned a stale clone
+        return strategy;
     }
 
     public char getEncapsulator() {
-        return this.encapsulator;
+        return encapsulator;
     }
 
-    public void setCommentStart(char commentStart) {
-        this.commentStart = commentStart;
+    public CSVStrategy withEncapsulator(char encapsulator) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.encapsulator = encapsulator;
+        return strategy;
     }
 
     public char getCommentStart() {
-        return this.commentStart;
+        return commentStart;
+    }
+
+    public CSVStrategy withCommentStart(char commentStart) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.commentStart = commentStart;
+        return strategy;
     }
 
     public boolean isCommentingDisabled() {
         return this.commentStart == COMMENTS_DISABLED;
     }
 
-    public void setEscape(char escape) {
-        this.escape = escape;
+    public char getEscape() {
+        return escape;
     }
 
-    public char getEscape() {
-        return this.escape;
+    public CSVStrategy withEscape(char escape) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.escape = escape;
+        return strategy;
+    }
+
+    public boolean isLeadingSpacesIgnored() {
+        return leadingSpacesIgnored;
+    }
+
+    public CSVStrategy withLeadingSpacesIgnored(boolean leadingSpacesIgnored) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.leadingSpacesIgnored = leadingSpacesIgnored;
+        return strategy;
     }
 
-    public void setIgnoreLeadingWhitespaces(boolean ignoreLeadingWhitespaces) {
-        this.ignoreLeadingWhitespaces = ignoreLeadingWhitespaces;
+    public boolean isTrailingSpacesIgnored() {
+        return trailingSpacesIgnored;
     }
 
-    public boolean getIgnoreLeadingWhitespaces() {
-        return this.ignoreLeadingWhitespaces;
+    public CSVStrategy withTrailingSpacesIgnored(boolean trailingSpacesIgnored) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.trailingSpacesIgnored = trailingSpacesIgnored;
+        return strategy;
     }
 
-    public void setIgnoreTrailingWhitespaces(boolean ignoreTrailingWhitespaces) {
-        this.ignoreTrailingWhitespaces = ignoreTrailingWhitespaces;
+    public boolean isUnicodeEscapesInterpreted() {
+        return unicodeEscapesInterpreted;
     }
 
-    public boolean getIgnoreTrailingWhitespaces() {
-        return this.ignoreTrailingWhitespaces;
+    public CSVStrategy withUnicodeEscapesInterpreted(boolean unicodeEscapesInterpreted) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.unicodeEscapesInterpreted = unicodeEscapesInterpreted;
+        return strategy;
     }
 
-    public void setUnicodeEscapeInterpretation(boolean interpretUnicodeEscapes) {
-        this.interpretUnicodeEscapes = interpretUnicodeEscapes;
+    public boolean isEmptyLinesIgnored() {
+        return emptyLinesIgnored;
     }
 
-    public boolean getUnicodeEscapeInterpretation() {
-        return this.interpretUnicodeEscapes;
+    public CSVStrategy withEmptyLinesIgnored(boolean emptyLinesIgnored) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.emptyLinesIgnored = emptyLinesIgnored;
+        return strategy;
     }
 
-    public boolean getIgnoreEmptyLines() {
-        return this.ignoreEmptyLines;
+    public String getLineSeparator() {
+        return lineSeparator;
     }
 
-    public String getPrinterNewline() {
-        return this.printerNewline;
+    public CSVStrategy withLineSeparator(String lineSeparator) {
+        CSVStrategy strategy = (CSVStrategy) clone();
+        strategy.lineSeparator = lineSeparator;
+        return strategy;
     }
 
-    public Object clone() {
+    protected Object clone() {
         try {
             return super.clone();
         } catch (CloneNotSupportedException e) {
-            throw new RuntimeException(e);  // impossible
+            throw (Error) new InternalError().initCause(e);
         }
     }
 }
diff --git a/src/test/java/org/apache/commons/csv/CSVParserTest.java b/src/test/java/org/apache/commons/csv/CSVParserTest.java
@@ -94,10 +94,8 @@ public void testNextToken2() throws IOException {
         *
         */
         String code = "1,2,3,\na,b x,c\n#foo\n\nd,e,\n\n";
-        CSVStrategy strategy = (CSVStrategy) CSVStrategy.DEFAULT_STRATEGY.clone();
-        // strategy.setIgnoreEmptyLines(false);
-        strategy.setCommentStart('#');
-
+        CSVStrategy strategy = CSVStrategy.DEFAULT_STRATEGY.withCommentStart('#');
+        
         TestCSVParser parser = new TestCSVParser(new StringReader(code), strategy);
 
 
@@ -123,8 +121,7 @@ public void testNextToken3() throws IOException {
         *       \,,
         */
         String code = "a,\\,,b\n\\,,";
-        CSVStrategy strategy = (CSVStrategy) CSVStrategy.DEFAULT_STRATEGY.clone();
-        strategy.setCommentStart('#');
+        CSVStrategy strategy = CSVStrategy.DEFAULT_STRATEGY.withCommentStart('#');
         TestCSVParser parser = new TestCSVParser(new StringReader(code), strategy);
 
         assertEquals(CSVParser.TT_TOKEN + ";a;", parser.testNextToken());
@@ -520,8 +517,7 @@ public void testDefaultStrategy() throws IOException {
 
     public void testUnicodeEscape() throws IOException {
         String code = "abc,\\u0070\\u0075\\u0062\\u006C\\u0069\\u0063";
-        CSVParser parser = new CSVParser(new StringReader(code));
-        parser.getStrategy().setUnicodeEscapeInterpretation(true);
+        CSVParser parser = new CSVParser(new StringReader(code), CSVStrategy.DEFAULT_STRATEGY.withUnicodeEscapesInterpreted(true));
         String[] data = parser.getLine();
         assertEquals(2, data.length);
         assertEquals("abc", data[0]);
diff --git a/src/test/java/org/apache/commons/csv/CSVStrategyTest.java b/src/test/java/org/apache/commons/csv/CSVStrategyTest.java

Original file line number	Diff line number	Diff line change
`@@ -58,7 +58,7 @@ public CSVPrinter(Writer out, CSVStrategy strategy) {`
`58`	`58`	`* Output a blank line`
`59`	`59`	`*/`
`60`	`60`	`public void println() throws IOException {`
`61`		`- out.write(strategy.getPrinterNewline());`
	`61`	`+ out.write(strategy.getLineSeparator());`
`62`	`62`	`newLine = true;`
`63`	`63`	`}`
`64`	`64`