Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
73 changes: 69 additions & 4 deletions CHANGES.md
Original file line number Diff line number Diff line change
@@ -1,8 +1,73 @@
Unreleased
----------

#### Dependency upgrades
2.0.0
-----

### Removals

#### Removed Apache HttpClient 3.1

`HTTPSeekableLineReaderFactory` and `ZipNumBlockLoader` now default to HttpClient 4.3.

| Removed | Replacement |
|-----------------------------------------------------------|--------------------------------------|
| `org.apache.commons.httpclient.URIException` | `org.archive.url.URIException` |
| `org.apache.commons.httpclient.Header` | `org.archive.format.http.HttpHeader` |
| `org.archive.httpclient.HttpRecorderGetMethod` | |
| `org.archive.httpclient.HttpRecorderMethod` | |
| `org.archive.httpclient.HttpRecorderPostMethod` | |
| `org.archive.httpclient.SingleHttpConnectionManager` | |
| `org.archive.httpclient.ThreadLocalHttpConnectionManager` | |

#### Removed deprecated versions of renamed classes

| Removed | Replacement |
|-----------------------------------------------|--------------------------------------------------|
| `org.archive.io.ArchiveFileConstants` | `org.archive.format.ArchiveFileConstants` |
| `org.archive.io.GzipHeader` | `org.archive.util.zip.GzipHeader` |
| `org.archive.io.GZIPMembersInputStream` | `org.archive.util.zip.GZIPMembersInputStream` |
| `org.archive.io.NoGzipMagicException` | `org.archive.util.zip.NoGzipMagicException` |
| `org.archive.io.arc.ARCConstants` | `org.archive.format.arc.ARCConstants` |
| `org.archive.io.warc.WARCConstants` | `org.archive.format.warc.WARCConstants` |
| `org.archive.url.DefaultIACanonicalizerRules` | `org.archive.url.AggressiveIACanonicalizerRules` |
| `org.archive.url.DefaultIAURLCanonicalizer` | `org.archive.url.AggressiveIAURLCanonicalizer` |
| `org.archive.url.GoogleURLCanonicalizer` | `org.archive.url.BasicURLCanonicalizer` |

#### Removed deprecated methods

| Removed | Replacement |
|-----------------------------------------------|-------------------------------------------|
| `ANVLRecord(int)` | `ANVLRecord()` |
| `DevUtils.betterPrintStack(RuntimeException)` | `Throwable.printStackTrace()` |
| `Recorder.getReplayCharSequence()` | `Recorder.getContentReplayCharSequence()` |
| `Reporter.shortReportLineTo(PrintWriter)` | `Reporter.reportTo(PrintWriter)` |

#### Removed usages of constant interfaces

Static imports should be used instead.

* `ArchiveFileConstants` is no longer implemented by:
  * `ArchiveReader`
  * `ArchiveReaderFactory`
  * `WARCWriter`
  * `WriterPool`
  * `WriterPoolMember`
* `ARCConstants` is no longer implemented by:
  * `ARCReader`
  * `ARCReaderFactory`
  * `ARCRecord`
  * `ARCRecordMetaData`
  * `ARCUtils`
  * `ARCWriter`
* `WARCConstants` is no longer implemented by:
  * `WARCReader`
  * `WARCReaderFactory`
  * `WARCRecord`
  * `WARCWriter`

### Dependency upgrades

- **commons-io**: 2.18.0 → 2.19.0
- **guava**: 33.3.1-jre → 33.4.8-jre
- **json**: 20240303 → 20250517
- **junit**: 4.13.2 → 5.12.2

1.3.0
Expand Down
17 changes: 13 additions & 4 deletions pom.xml
Original file line number Diff line number Diff line change
Expand Up @@ -61,13 +61,13 @@
<dependency>
<groupId>com.google.guava</groupId>
<artifactId>guava</artifactId>
<version>33.3.1-jre</version>
<version>33.4.8-jre</version>
</dependency>

<dependency>
<groupId>org.json</groupId>
<artifactId>json</artifactId>
<version>20240303</version>
<version>20250517</version>
</dependency>
<dependency>
<groupId>org.htmlparser</groupId>
Expand Down Expand Up @@ -141,7 +141,7 @@
<dependency>
<groupId>commons-io</groupId>
<artifactId>commons-io</artifactId>
<version>2.18.0</version>
<version>2.19.0</version>
</dependency>

<dependency>
Expand All @@ -162,7 +162,7 @@
<plugin>
<groupId>org.apache.maven.plugins</groupId>
<artifactId>maven-compiler-plugin</artifactId>
<version>2.3.2</version>
<version>3.14.0</version>
<configuration>
<source>8</source>
<target>8</target>
Expand Down Expand Up @@ -265,6 +265,15 @@
</plugins>
</build>
</profile>
<profile>
<id>jdk9-plus</id>
<activation>
<jdk>[9,)</jdk>
</activation>
<properties>
<maven.compiler.release>8</maven.compiler.release>
</properties>
</profile>
</profiles>

</project>
24 changes: 0 additions & 24 deletions src/main/java/org/archive/io/ArchiveFileConstants.java

This file was deleted.

9 changes: 5 additions & 4 deletions src/main/java/org/archive/io/ArchiveReader.java
Original file line number Diff line number Diff line change
Expand Up @@ -42,13 +42,15 @@

import com.google.common.io.CountingInputStream;

import static org.archive.format.ArchiveFileConstants.*;


/**
* Reader for an Archive file of Archive {@link ArchiveRecord}s.
* @author stack
* @version $Date$ $Version$
*/
public abstract class ArchiveReader implements ArchiveFileConstants, Iterable<ArchiveRecord>, Closeable {
public abstract class ArchiveReader implements Iterable<ArchiveRecord>, Closeable {
/**
* Is this Archive file compressed?
*/
Expand Down Expand Up @@ -601,8 +603,7 @@ public String getStrippedFileName() {
*/
public static String getStrippedFileName(String name,
final String dotFileExtension) {
name = stripExtension(name,
ArchiveFileConstants.DOT_COMPRESSED_FILE_EXTENSION);
name = stripExtension(name, DOT_COMPRESSED_FILE_EXTENSION);
return stripExtension(name, dotFileExtension);
}

Expand Down Expand Up @@ -699,7 +700,7 @@ public boolean outputRecord(final String format)
boolean result = true;
if (format.equals(CDX)) {
System.out.println(get().outputCdx(getStrippedFileName()));
} else if(format.equals(ArchiveFileConstants.DUMP)) {
} else if(format.equals(DUMP)) {
// No point digesting if dumping content.
setDigest(false);
get().dump();
Expand Down
3 changes: 2 additions & 1 deletion src/main/java/org/archive/io/ArchiveReaderFactory.java
Original file line number Diff line number Diff line change
Expand Up @@ -33,14 +33,15 @@
import org.archive.url.UsableURI;
import org.archive.util.FileUtils;

import static org.archive.format.ArchiveFileConstants.*;

/**
* Factory that returns an Archive file Reader.
* Returns Readers for ARCs or WARCs.
* @author stack
* @version $Date$ $Revision$
*/
public class ArchiveReaderFactory implements ArchiveFileConstants {
public class ArchiveReaderFactory {
// Static block to enable S3 URLs
static {
if (System.getProperty("java.protocol.handler.pkgs") != null) {
Expand Down
1 change: 1 addition & 0 deletions src/main/java/org/archive/io/ArchiveRecord.java
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@
import java.security.NoSuchAlgorithmException;
import java.util.logging.Level;

import org.archive.format.ArchiveFileConstants;
import org.archive.util.Base32;

/**
Expand Down
38 changes: 0 additions & 38 deletions src/main/java/org/archive/io/GZIPMembersInputStream.java

This file was deleted.

26 changes: 0 additions & 26 deletions src/main/java/org/archive/io/GzipHeader.java

This file was deleted.

2 changes: 1 addition & 1 deletion src/main/java/org/archive/io/HeaderedArchiveRecord.java
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@
import java.io.PrintStream;

import org.archive.format.http.HttpHeader;
import org.archive.io.arc.ARCConstants;
import org.archive.format.arc.ARCConstants;
import org.archive.util.LaxHttpParser;

/**
Expand Down
26 changes: 0 additions & 26 deletions src/main/java/org/archive/io/NoGzipMagicException.java

This file was deleted.

3 changes: 2 additions & 1 deletion src/main/java/org/archive/io/WriterPool.java
Original file line number Diff line number Diff line change
Expand Up @@ -30,6 +30,7 @@
import java.util.logging.Level;
import java.util.logging.Logger;

import org.archive.format.ArchiveFileConstants;
import org.json.JSONArray;
import org.json.JSONException;
import org.json.JSONObject;
Expand Down Expand Up @@ -215,7 +216,7 @@ public synchronized void invalidateFile(WriterPoolMember f)
// gets attention.
File file = f.getFile();
file.renameTo(new File(file.getAbsoluteFile() +
WriterPoolMember.INVALID_SUFFIX));
ArchiveFileConstants.INVALID_SUFFIX));
}

/**
Expand Down
3 changes: 2 additions & 1 deletion src/main/java/org/archive/io/WriterPoolMember.java
Original file line number Diff line number Diff line change
Expand Up @@ -38,6 +38,7 @@
import org.archive.util.FileUtils;
import org.archive.util.PropertyUtils;

import static org.archive.format.ArchiveFileConstants.*;


/**
Expand All @@ -48,7 +49,7 @@
* @author stack
* @version $Date$ $Revision$
*/
public abstract class WriterPoolMember implements ArchiveFileConstants {
public abstract class WriterPoolMember {
private final Logger logger = Logger.getLogger(this.getClass().getName());

public static final String UTF8 = "UTF-8";
Expand Down
29 changes: 0 additions & 29 deletions src/main/java/org/archive/io/arc/ARCConstants.java

This file was deleted.

3 changes: 2 additions & 1 deletion src/main/java/org/archive/io/arc/ARCReader.java
Original file line number Diff line number Diff line change
Expand Up @@ -43,6 +43,7 @@
import org.archive.io.WriterPoolMember;
import org.archive.util.ArchiveUtils;

import static org.archive.format.arc.ARCConstants.*;

/**
* Get an iterator on an ARC file or get a record by absolute position.
Expand All @@ -66,7 +67,7 @@
* @version $Date$ $Revision$
*/
public abstract class ARCReader extends ArchiveReader
implements ARCConstants, Closeable {
implements Closeable {
private final Logger logger = Logger.getLogger(ARCReader.class.getName());

/**
Expand Down
Loading