Removed Default Convert Options

nicolaspearson · nicolaspearson · commit 7f67e2373fa2 · 2019-01-31T10:32:14.000+02:00
diff --git a/coverage/badge-branches.svg b/coverage/badge-branches.svg
@@ -1 +1 @@
-<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="152" height="20"><linearGradient id="b" x2="0" y2="100%"><stop offset="0" stop-color="#bbb" stop-opacity=".1"/><stop offset="1" stop-opacity=".1"/></linearGradient><clipPath id="a"><rect width="152" height="20" rx="3" fill="#fff"/></clipPath><g clip-path="url(#a)"><path fill="#555" d="M0 0h117v20H0z"/><path fill="#dfb317" d="M117 0h35v20H117z"/><path fill="url(#b)" d="M0 0h152v20H0z"/></g><g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110"> <text x="595" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="1070">Coverage:branches</text><text x="595" y="140" transform="scale(.1)" textLength="1070">Coverage:branches</text><text x="1335" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="250">80%</text><text x="1335" y="140" transform="scale(.1)" textLength="250">80%</text></g> </svg>
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="170" height="20"><linearGradient id="b" x2="0" y2="100%"><stop offset="0" stop-color="#bbb" stop-opacity=".1"/><stop offset="1" stop-opacity=".1"/></linearGradient><clipPath id="a"><rect width="170" height="20" rx="3" fill="#fff"/></clipPath><g clip-path="url(#a)"><path fill="#555" d="M0 0h117v20H0z"/><path fill="#e05d44" d="M117 0h53v20H117z"/><path fill="url(#b)" d="M0 0h170v20H0z"/></g><g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110"> <text x="595" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="1070">Coverage:branches</text><text x="595" y="140" transform="scale(.1)" textLength="1070">Coverage:branches</text><text x="1425" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="430">78.33%</text><text x="1425" y="140" transform="scale(.1)" textLength="430">78.33%</text></g> </svg>
diff --git a/coverage/badge-lines.svg b/coverage/badge-lines.svg
@@ -1 +1 @@
-<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="146" height="20"><linearGradient id="b" x2="0" y2="100%"><stop offset="0" stop-color="#bbb" stop-opacity=".1"/><stop offset="1" stop-opacity=".1"/></linearGradient><clipPath id="a"><rect width="146" height="20" rx="3" fill="#fff"/></clipPath><g clip-path="url(#a)"><path fill="#555" d="M0 0h93v20H0z"/><path fill="#dfb317" d="M93 0h53v20H93z"/><path fill="url(#b)" d="M0 0h146v20H0z"/></g><g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110"> <text x="475" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="830">Coverage:lines</text><text x="475" y="140" transform="scale(.1)" textLength="830">Coverage:lines</text><text x="1185" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="430">86.99%</text><text x="1185" y="140" transform="scale(.1)" textLength="430">86.99%</text></g> </svg>
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="146" height="20"><linearGradient id="b" x2="0" y2="100%"><stop offset="0" stop-color="#bbb" stop-opacity=".1"/><stop offset="1" stop-opacity=".1"/></linearGradient><clipPath id="a"><rect width="146" height="20" rx="3" fill="#fff"/></clipPath><g clip-path="url(#a)"><path fill="#555" d="M0 0h93v20H0z"/><path fill="#dfb317" d="M93 0h53v20H93z"/><path fill="url(#b)" d="M0 0h146v20H0z"/></g><g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110"> <text x="475" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="830">Coverage:lines</text><text x="475" y="140" transform="scale(.1)" textLength="830">Coverage:lines</text><text x="1185" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="430">86.21%</text><text x="1185" y="140" transform="scale(.1)" textLength="430">86.21%</text></g> </svg>
diff --git a/coverage/badge-statements.svg b/coverage/badge-statements.svg
@@ -1 +1 @@
-<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="182" height="20"><linearGradient id="b" x2="0" y2="100%"><stop offset="0" stop-color="#bbb" stop-opacity=".1"/><stop offset="1" stop-opacity=".1"/></linearGradient><clipPath id="a"><rect width="182" height="20" rx="3" fill="#fff"/></clipPath><g clip-path="url(#a)"><path fill="#555" d="M0 0h129v20H0z"/><path fill="#dfb317" d="M129 0h53v20H129z"/><path fill="url(#b)" d="M0 0h182v20H0z"/></g><g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110"> <text x="655" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="1190">Coverage:statements</text><text x="655" y="140" transform="scale(.1)" textLength="1190">Coverage:statements</text><text x="1545" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="430">86.99%</text><text x="1545" y="140" transform="scale(.1)" textLength="430">86.99%</text></g> </svg>
+<svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" width="182" height="20"><linearGradient id="b" x2="0" y2="100%"><stop offset="0" stop-color="#bbb" stop-opacity=".1"/><stop offset="1" stop-opacity=".1"/></linearGradient><clipPath id="a"><rect width="182" height="20" rx="3" fill="#fff"/></clipPath><g clip-path="url(#a)"><path fill="#555" d="M0 0h129v20H0z"/><path fill="#dfb317" d="M129 0h53v20H129z"/><path fill="url(#b)" d="M0 0h182v20H0z"/></g><g fill="#fff" text-anchor="middle" font-family="DejaVu Sans,Verdana,Geneva,sans-serif" font-size="110"> <text x="655" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="1190">Coverage:statements</text><text x="655" y="140" transform="scale(.1)" textLength="1190">Coverage:statements</text><text x="1545" y="150" fill="#010101" fill-opacity=".3" transform="scale(.1)" textLength="430">86.21%</text><text x="1545" y="140" transform="scale(.1)" textLength="430">86.21%</text></g> </svg>
diff --git a/src/index.ts b/src/index.ts
@@ -145,13 +145,6 @@ class Ocr {
 		args.push('-density');
 		args.push(`${options && options.convertDensity ? options.convertDensity : 300}`);
 		args.push(filePath);
-		args.push('-depth');
-		args.push('8');
-		args.push('-strip');
-		args.push('-background');
-		args.push('white');
-		args.push('-alpha');
-		args.push('off');
 		if (options && options.convertArgs) {
 			// Parse all provided options to command line arguments
 			for (const [key, value] of Object.entries(options.convertArgs)) {
diff --git a/test/extract-text.spec.ts b/test/extract-text.spec.ts
@@ -3,6 +3,18 @@ import * as temp from 'temp';
 
 import { ExtractTextOptions, Ocr } from '../src/index';
 
+const convertArgs = {
+	quality: '100',
+	trim: '',
+	depth: '8',
+	strip: '',
+	background: 'white',
+	alpha: 'off'
+};
+
+// tslint:disable object-literal-key-quotes
+const tesseractArgs = { '-psm': 6, c: 'preserve_interword_spaces=1' };
+
 describe('Extract Text Tests', () => {
 	it('should be able to extract pdf text from single-page.pdf', async (done) => {
 		jest.setTimeout(15 * 1000);
@@ -11,7 +23,10 @@ describe('Extract Text Tests', () => {
 		const pdfPath = path.join(__dirname, relativePath);
 
 		try {
-			const result: string = await Ocr.extractText(pdfPath);
+			const options: ExtractTextOptions = {
+				convertArgs
+			};
+			const result: string = await Ocr.extractText(pdfPath, options);
 			expect(result).toBeDefined();
 			expect(result).toContain('00001-001-0002');
 		} catch (error) {
@@ -29,7 +44,10 @@ describe('Extract Text Tests', () => {
 		const pdfPath = path.join(__dirname, relativePath);
 
 		try {
-			const result: string = await Ocr.extractText(pdfPath);
+			const options: ExtractTextOptions = {
+				convertArgs
+			};
+			const result: string = await Ocr.extractText(pdfPath, options);
 			expect(result).toBeDefined();
 			expect(result).toContain('00001-001-0002');
 		} catch (error) {
@@ -41,13 +59,16 @@ describe('Extract Text Tests', () => {
 	});
 
 	it('should be able to extract pdf text from multi-page.pdf', async (done) => {
-		jest.setTimeout(15 * 1000);
+		jest.setTimeout(25 * 1000);
 		const fileName = 'multi-page.pdf';
 		const relativePath = path.join('sample', fileName);
 		const pdfPath = path.join(__dirname, relativePath);
 
 		try {
-			const options: ExtractTextOptions = { convertDensity: 400, convertArgs: { trim: '' } };
+			const options: ExtractTextOptions = {
+				convertDensity: 600,
+				convertArgs
+			};
 			const result: string = await Ocr.extractText(pdfPath, options);
 			expect(result).toBeDefined();
 			expect(result).toContain('National Airspace System');
@@ -67,7 +88,11 @@ describe('Extract Text Tests', () => {
 		const pdfPath = path.join(__dirname, relativePath);
 
 		try {
-			const options: ExtractTextOptions = { pdfToTextArgs: { f: 1, l: 4 } };
+			const options: ExtractTextOptions = {
+				pdfToTextArgs: { f: 1, l: 4 },
+				convertDensity: 600,
+				convertArgs
+			};
 			const result: string = await Ocr.extractText(pdfPath, options);
 			expect(result).toBeDefined();
 			expect(result).toContain('TraceMonkey');
@@ -81,17 +106,19 @@ describe('Extract Text Tests', () => {
 	});
 
 	it('should be able to extract text from sample.png', async (done) => {
-		jest.setTimeout(15 * 1000);
+		jest.setTimeout(25 * 1000);
 		const fileName = 'sample.png';
 		const relativePath = path.join('sample', fileName);
 		const pngPath = path.join(__dirname, relativePath);
 
 		try {
 			const tmpDir = temp.mkdirSync('tmp');
-			// tslint:disable object-literal-key-quotes
+
 			const options: ExtractTextOptions = {
+				convertDensity: 600,
+				convertArgs,
 				tesseractLang: 'eng',
-				tesseractArgs: { '-psm': 6, c: 'preserve_interword_spaces=1' }
+				tesseractArgs
 			};
 			const result: string = await Ocr.invokeImageOcr(tmpDir, pngPath, options);
 			expect(result).toBeDefined();
@@ -105,17 +132,24 @@ describe('Extract Text Tests', () => {
 	});
 
 	it('should be able to extract text from sample-low.jpg', async (done) => {
-		jest.setTimeout(15 * 1000);
+		jest.setTimeout(25 * 1000);
 		const fileName = 'sample-low.jpg';
 		const relativePath = path.join('sample', fileName);
 		const jpgPath = path.join(__dirname, relativePath);
 
 		try {
 			const options: ExtractTextOptions = {
 				convertDensity: 600,
-				convertArgs: { trim: '' },
+				convertArgs: {
+					...convertArgs,
+					verbose: '',
+					flatten: '',
+					contrast: '',
+					'auto-level': '',
+					sharpen: '0x4.0'
+				},
 				tesseractLang: 'eng',
-				tesseractArgs: { '-psm': 6 }
+				tesseractArgs
 			};
 			const result: string = await Ocr.extractText(jpgPath, options);
 			expect(result).toBeDefined();