This repository was archived by the owner on Nov 7, 2020. It is now read-only.
File tree 15 files changed +39
-34
lines changed
src/com/morethanheroic/warc/service
test/com/mixnode/test/warcreader
15 files changed +39
-34
lines changed Original file line number Diff line number Diff line change 1
1
<project >
2
2
<modelVersion >4.0.0</modelVersion >
3
- <groupId >com.mixnode.utils </groupId >
4
- <artifactId >warcreader </artifactId >
3
+ <groupId >com.morethanheroic </groupId >
4
+ <artifactId >warc </artifactId >
5
5
<version >1.0</version >
6
6
<packaging >jar</packaging >
7
7
<name >WARC-reader</name >
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader ;
1
+ package com .morethanheroic . warc . service ;
2
2
3
3
import java .io .IOException ;
4
4
5
- @ SuppressWarnings ("serial" )
6
5
public class WarcFormatException extends IOException {
7
6
8
7
public WarcFormatException (String message ) {
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader ;
1
+ package com .morethanheroic . warc . service ;
2
2
3
- import com .mixnode .warcreader .record .WarcRecord ;
3
+ import com .morethanheroic .warc .service .http .HttpParser ;
4
+ import com .morethanheroic .warc .service .record .domain .WarcRecord ;
4
5
5
- import com .mixnode . warcreader .service .WarcRecordFactory ;
6
+ import com .morethanheroic . warc .service . record .WarcRecordFactory ;
6
7
import java .io .Closeable ;
7
8
import java .io .IOException ;
8
9
import java .io .InputStream ;
13
14
import org .apache .http .message .HeaderGroup ;
14
15
15
16
/**
16
- * WarcReader class provides basic functions to read and parse a WARC file. Providing a compressed
17
- * or an uncompressed stream of WARC file, WarcReader reads WARC records and parses it to a
18
- * WarcRecord object
19
- *
20
- * @author Hadi Jooybar
17
+ * This class provides basic functions to read and parse a WARC file. Providing a compressed or an
18
+ * uncompressed stream of WARC file, WarcReader reads WARC records and parses them to {@link
19
+ * WarcRecord} objects.
21
20
*/
22
21
public class WarcReader implements Closeable {
23
22
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader . record ;
1
+ package com .morethanheroic . warc . service . content . domain ;
2
2
3
3
import java .io .InputStream ;
4
4
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader . record ;
1
+ package com .morethanheroic . warc . service . content . domain ;
2
2
3
3
import java .io .InputStream ;
4
4
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader .service ;
1
+ package com .morethanheroic . warc .service . content . request ;
2
2
3
- import com .mixnode .warcreader .WarcFormatException ;
4
- import com .mixnode .warcreader .record .RequestContentBlock ;
3
+ import com .morethanheroic .warc .service .WarcFormatException ;
4
+ import com .morethanheroic .warc .service .content .request .domain .RequestContentBlock ;
5
+ import com .morethanheroic .warc .service .header .HeaderParser ;
5
6
import java .io .IOException ;
6
7
import org .apache .commons .io .input .BoundedInputStream ;
7
8
import org .apache .http .HttpException ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader . record ;
1
+ package com .morethanheroic . warc . service . content . request . domain ;
2
2
3
+ import com .morethanheroic .warc .service .content .domain .WarcContentBlock ;
3
4
import java .io .InputStream ;
4
5
import java .util .Collections ;
5
6
import java .util .Map ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader .service ;
1
+ package com .morethanheroic . warc .service . content . response ;
2
2
3
- import com .mixnode .warcreader .WarcFormatException ;
4
- import com .mixnode .warcreader .record .ResponseContentBlock ;
3
+ import com .morethanheroic .warc .service .WarcFormatException ;
4
+ import com .morethanheroic .warc .service .content .response .domain .ResponseContentBlock ;
5
+ import com .morethanheroic .warc .service .header .HeaderParser ;
5
6
import java .io .IOException ;
6
7
import org .apache .commons .io .input .BoundedInputStream ;
7
8
import org .apache .http .Header ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader . record ;
1
+ package com .morethanheroic . warc . service . content . response . domain ;
2
2
3
+ import com .morethanheroic .warc .service .content .domain .WarcContentBlock ;
3
4
import java .io .InputStream ;
4
5
import java .util .Collections ;
5
6
import java .util .Map ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader .service ;
1
+ package com .morethanheroic . warc .service . header ;
2
2
3
3
import java .util .Arrays ;
4
4
import java .util .Map ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader ;
1
+ package com .morethanheroic . warc . service . http ;
2
2
3
3
import java .io .ByteArrayOutputStream ;
4
4
import java .io .IOException ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader .service ;
1
+ package com .morethanheroic . warc .service . record ;
2
2
3
- import com .mixnode .warcreader .record .DefaultContentBlock ;
4
- import com .mixnode .warcreader .record .WarcContentBlock ;
5
- import com .mixnode .warcreader .record .WarcRecord ;
6
- import com .mixnode .warcreader .record .WarcType ;
3
+ import com .morethanheroic .warc .service .content .domain .DefaultContentBlock ;
4
+ import com .morethanheroic .warc .service .content .domain .WarcContentBlock ;
5
+ import com .morethanheroic .warc .service .content .request .RequestContentBlockFactory ;
6
+ import com .morethanheroic .warc .service .content .response .ResponseContentBlockFactory ;
7
+ import com .morethanheroic .warc .service .record .domain .WarcRecord ;
8
+ import com .morethanheroic .warc .service .record .domain .WarcType ;
7
9
import java .io .IOException ;
8
10
import java .util .Arrays ;
9
11
import java .util .Collections ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader . record ;
1
+ package com .morethanheroic . warc . service . record . domain ;
2
2
3
+ import com .morethanheroic .warc .service .content .domain .WarcContentBlock ;
3
4
import java .util .Collections ;
4
5
import java .util .Map ;
5
6
import java .util .Optional ;
Original file line number Diff line number Diff line change 1
- package com .mixnode . warcreader . record ;
1
+ package com .morethanheroic . warc . service . record . domain ;
2
2
3
3
/**
4
4
* WarcType specifies the type of a WARC record. 'WARC-Type' field is mandatory for all WARC
Original file line number Diff line number Diff line change 1
1
package com .mixnode .test .warcreader ;
2
2
3
- import com .mixnode . warcreader .WarcReader ;
4
- import com .mixnode . warcreader . record .WarcRecord ;
3
+ import com .morethanheroic . warc . service .WarcReader ;
4
+ import com .morethanheroic . warc . service . record . domain .WarcRecord ;
5
5
6
- import com .mixnode . warcreader . record .WarcType ;
6
+ import com .morethanheroic . warc . service . record . domain .WarcType ;
7
7
import java .io .File ;
8
8
import java .io .FileInputStream ;
9
9
import java .io .IOException ;
You can’t perform that action at this time.
0 commit comments