split more

ilyatikhonov · Jun 3, 2015 · 2282dba · 2282dba
1 parent 43be624
commit 2282dba
Show file tree

Hide file tree

Showing 10 changed files with 329 additions and 301 deletions.
diff --git a/.gitignore b/.gitignore
@@ -1,6 +1,7 @@
 *.o
 *.i
 *.s
+*.d
 
 *.png
 *.jpg

diff --git a/Makefile b/Makefile
@@ -1,12 +1,14 @@
 CC:=gcc
-CFLAGS:=-std=c11 -Wall -Wextra -Winline -pedantic -Ofast -march=pentium4 -s -DNDEBUG
+CFLAGS:=-std=c11 -Wall -Wextra -Winline -pedantic -Ofast -march=pentium4 -DNDEBUG
 #CFLAGS:=-std=c11 -Wall -Wextra -pedantic -Og -g
+LFLAGS:=-s
 LIBS:=-ljpeg -lpng -lfftw3f -lm
+OBJS:=jpeg2png.o utils.o jpeg.o png.o box.o upsample.o compute.o
 
-SRCS:=jpeg2png.c utils.c jpeg.c
+jpeg2png: $(OBJS)
+	$(CC) $^ -o $@ $(LFLAGS) $(LIBS)
 
-jpeg2png: jpeg2png.o utils.o jpeg.o png.o box.o
-	$(CC) $^ -o $@ $(LIBS)
+-include $(OBJS:.o=.d)
 
-%o: %.c *.h
-	$(CC) $< -o $@ $(CFLAGS)
+%.o: %.c
+	$(CC) -MMD $< -c -o $@ $(CFLAGS)
diff --git a/compute.c b/compute.c
@@ -0,0 +1,218 @@
+#include <stdint.h>
+#include <fftw3.h>
+
+#include "jpeg2png.h"
+#include "compute.h"
+#include "utils.h"
+#include "box.h"
+
+static float compute_step(struct coef *coef, float *objective_gradient, float *fdata_x, float *fdata_y, float weight, float step_size) {
+        int w = coef->w;
+        int h = coef->h;
+        float *fdata = coef->fdata;
+        float alpha = weight / sqrt(4. / 2.);
+
+        for(int i = 0; i < h * w; i++) {
+                objective_gradient[i] = 0.;
+        }
+
+        float tv = 0.;
+        for(int y = 0; y < h; y++) {
+                for(int x = 0; x < w; x++) {
+                        // forward gradient x
+                        float g_x = x >= w-1 ? 0. : *p(fdata, x+1, y, w, h) - *p(fdata, x, y, w, h);
+                        // forward gradient y
+                        float g_y = y >= h-1 ? 0. : *p(fdata, x, y+1, w, h) - *p(fdata, x, y, w, h);
+                        // norm
+                        float g_norm = sqrt(g_x * g_x + g_y * g_y);
+                        tv += g_norm;
+                        // compute derivatives
+                        if(g_norm != 0) {
+                                *p(objective_gradient, x, y, w, h) += -(g_x + g_y) / g_norm;
+                                if(x < w-1) {
+                                        *p(objective_gradient, x+1, y, w, h) += g_x / g_norm;
+                                }
+                                if(y < h-1) {
+                                        *p(objective_gradient, x, y+1, w, h) += g_y / g_norm;
+                                }
+                        }
+                        if(alpha != 0.) {
+                                *p(fdata_x, x, y, w, h) = g_x;
+                                *p(fdata_y, x, y, w, h) = g_y;
+                        }
+                }
+        }
+        // printf("tv = %f, %f\n", tv, tv / (w * h) / sqrt(2.));
+
+        float tv2 = 0;
+        if(alpha != 0.) {
+                for(int y = 0; y < h; y++) {
+                        for(int x = 0; x < w; x++) {
+                                // backward x
+                                float g_xx = x <= 0 ? 0. : *p(fdata_x, x, y, w, h) - *p(fdata_x, x-1, y, w, h);
+                                // backward x
+                                float g_yx = x <= 0 ? 0. : *p(fdata_y, x, y, w, h) - *p(fdata_y, x-1, y, w, h);
+                                // backward y
+                                float g_xy = y <= 0 ? 0. : *p(fdata_x, x, y, w, h) - *p(fdata_x, x, y-1, w, h);
+                                // backward y
+                                float g_yy = y <= 0 ? 0. : *p(fdata_y, x, y, w, h) - *p(fdata_y, x, y-1, w, h);
+                                // norm
+                                float g2_norm = sqrt(g_xx * g_xx + g_yx * g_yx + g_xy * g_xy + g_yy * g_yy);
+                                tv2 += g2_norm;
+                                // compute derivatives
+                                if(g2_norm != 0.) {
+                                        *p(objective_gradient, x, y, w, h) += alpha * (-(2. * g_xx + g_xy + g_yx + 2. *  g_yy) / g2_norm);
+                                        if(x > 0) {
+                                                *p(objective_gradient, x-1, y, w, h) += alpha * ((g_yx + g_xx) / g2_norm);
+                                        }
+                                        if(x < w-1) {
+                                                *p(objective_gradient, x+1, y, w, h) += alpha * ((g_xx + g_xy) / g2_norm);
+                                        }
+                                        if(y > 0) {
+                                                *p(objective_gradient, x, y-1, w, h) += alpha * ((g_yy + g_xy) / g2_norm);
+                                        }
+                                        if(y < h-1) {
+                                                *p(objective_gradient, x, y+1, w, h) += alpha * ((g_yy + g_yx) / g2_norm);
+                                        }
+                                        if(x < w-1 && y > 0) {
+                                                *p(objective_gradient, x+1, y-1, w, h) += alpha * ((-g_xy) / g2_norm);
+                                        }
+                                        if(x > 0 && y < h-1) {
+                                                *p(objective_gradient, x-1, y+1, w, h) += alpha * ((-g_yx) / g2_norm);
+                                        }
+                                }
+                        }
+                }
+                // printf("tv2 = %f, %f\n", tv2, tv2 / (w * h));
+        }
+
+        for(int i = 0; i < h * w; i++) {
+                fdata[i] -= step_size * (objective_gradient[i] / (alpha + 1.));
+        }
+
+        return (tv + alpha * tv2) / (alpha + 1.);
+}
+
+struct compute_projection_aux {
+        float * restrict q_min;
+        float * restrict q_max;
+        float *temp;
+        fftwf_plan dct;
+        fftwf_plan idct;
+};
+
+static void compute_projection_init(struct coef *coef, uint16_t quant_table[64],struct compute_projection_aux *aux) {
+        int w = coef->w;
+        int h = coef->h;
+
+        float *q_max = fftwf_alloc_real(h * w);
+        if(!q_max) { die("allocation error"); }
+        float *q_min = fftwf_alloc_real(h * w);
+        if(!q_min) { die("allocation error"); }
+        int blocks = (h / 8) * (w / 8);
+
+        for(int i = 0; i < blocks; i++) {
+                for(int j = 0; j < 64; j++) {
+                       q_max[i*64+j] = (coef->data[i*64+j] + 0.5) * quant_table[j];
+                       q_min[i*64+j] = (coef->data[i*64+j] - 0.5) * quant_table[j];
+                }
+        }
+
+        for(int i = 0; i < blocks; i++) {
+                for(int v = 0; v < 8; v++) {
+                        for(int u = 0; u < 8; u++) {
+                                q_max[i*64 + v*8+u] /= a(u) * a(v);
+                                q_min[i*64 + v*8+u] /= a(u) * a(v);
+                        }
+                }
+        }
+
+        aux->q_min = q_min;
+        aux->q_max = q_max;
+
+        float *temp = fftwf_alloc_real(h * w);
+        if(!temp) { die("allocation error"); }
+
+        aux->temp = temp;
+
+        fftwf_plan dct = fftwf_plan_many_r2r(
+                2, (int[]){8, 8}, blocks,
+                temp, (int[]){8, 8}, 1, 64,
+                temp, (int[]){8, 8}, 1, 64,
+                (void*)(int[]){FFTW_REDFT10, FFTW_REDFT10}, FFTW_ESTIMATE);
+
+        aux->dct = dct;
+
+        fftwf_plan idct = fftwf_plan_many_r2r(
+                2, (int[]){8, 8}, blocks,
+                temp, (int[]){8, 8}, 1, 64,
+                temp, (int[]){8, 8}, 1, 64,
+                (void*)(int[]){FFTW_REDFT01, FFTW_REDFT01}, FFTW_ESTIMATE);
+
+        aux->idct = idct;
+}
+
+static void compute_projection_destroy(struct compute_projection_aux *aux) {
+        fftwf_destroy_plan(aux->idct);
+        fftwf_destroy_plan(aux->dct);
+        fftwf_free(aux->temp);
+        fftwf_free(aux->q_min);
+        fftwf_free(aux->q_max);
+}
+
+static void compute_projection(struct coef *coef, struct compute_projection_aux *aux) {
+        int w = coef->w;
+        int h = coef->h;
+        float *fdata = coef->fdata;
+
+        float *temp = aux->temp;
+
+        int blocks = (h / 8) * (w / 8);
+
+        box(fdata, temp, w, h);
+
+        fftwf_execute(aux->dct);
+        for(int i = 0; i < h * w; i++) {
+                temp[i] /= 16.;
+        }
+
+        for(int i = 0; i < h * w; i++) {
+                temp[i] = CLAMP(temp[i], aux->q_min[i], aux->q_max[i]);
+        }
+
+        fftwf_execute(aux->idct);
+        for(int i = 0; i < blocks * 64; i++) {
+                temp[i] /= 16.;
+        }
+
+        unbox(temp, fdata, w, h);
+}
+
+void compute(struct coef *coef, uint16_t quant_table[64]) {
+        struct compute_projection_aux cpa;
+        compute_projection_init(coef, quant_table, &cpa);
+
+        int h = coef->h;
+        int w = coef->w;
+
+        float *fdata_x = fftwf_alloc_real(h * w);
+        if(!fdata_x) { die("allocation error"); }
+        float *fdata_y = fftwf_alloc_real(h * w);
+        if(!fdata_y) { die("allocation error"); }
+        float *objective_gradient = fftwf_alloc_real(h * w);
+        if(!objective_gradient) { die("allocation error"); }
+
+        const int N = 100;
+        float tv;
+        for(int i = 0; i < N; i++) {
+                compute_projection(coef, &cpa);
+                tv = compute_step(coef, fdata_x, fdata_y, objective_gradient, 0.3, 1. / sqrt(1 + N));
+        }
+
+        printf("objective = %f, %f\n", tv, tv / (coef->w * coef->h) / sqrt(2.));
+
+        fftwf_free(fdata_x);
+        fftwf_free(fdata_y);
+        fftwf_free(objective_gradient);
+        compute_projection_destroy(&cpa);
+}
diff --git a/compute.h b/compute.h
@@ -0,0 +1,8 @@
+#ifndef JPEG2PNG_COMPUTE_H
+#define JPEG2PNG_COMPUTE_H
+
+#include <stdint.h>
+
+void compute(struct coef *coef, uint16_t quant_table[64]);
+
+#endif
diff --git a/jpeg.c b/jpeg.c
@@ -1,9 +1,12 @@
+#include <assert.h>
 #include <stdlib.h>
 #include <stdio.h>
 #include <stdbool.h>
+#include <stdint.h>
 #include <string.h>
 
 #include <jpeglib.h>
+#include <fftw3.h>
 
 #include "jpeg.h"
 #include "utils.h"
@@ -47,3 +50,29 @@ void read_jpeg(FILE *in, struct jpeg *jpeg) {
         }
         jpeg_destroy_decompress(&d);
 }
+
+void decode_coefficients(struct coef *coef, uint16_t *quant_table) {
+        coef->fdata = fftwf_alloc_real(coef->h * coef->w);
+        if(!coef->fdata) { die("allocation error"); }
+        int blocks = (coef->h / 8) * (coef->w / 8);
+        for(int i = 0; i < blocks; i++) {
+                for(int j = 0; j < 64; j++) {
+                        coef->fdata[i*64+j] = coef->data[i*64+j] * quant_table[j];
+                }
+                for(int v = 0; v < 8; v++) {
+                        for(int u = 0; u < 8; u++) {
+                                coef->fdata[i*64 + v*8+u] /= a(u) * a(v);
+                        }
+                }
+        }
+        fftwf_plan p = fftwf_plan_many_r2r(
+                2, (int[]){8, 8}, blocks,
+                coef->fdata, (int[]){8, 8}, 1, 64,
+                coef->fdata, (int[]){8, 8}, 1, 64,
+                (void*)(int[]){FFTW_REDFT01, FFTW_REDFT01}, FFTW_ESTIMATE);
+        fftwf_execute(p);
+        fftwf_destroy_plan(p);
+        for(int i = 0; i < blocks * 64; i++) {
+                coef->fdata[i] /= 16.;
+        }
+}
diff --git a/jpeg.h b/jpeg.h
@@ -2,6 +2,7 @@
 #define JPEG2PNG_JPEG_H
 
 #include <stdio.h>
+#include <stdint.h>
 
 #include "jpeg2png.h"
 
@@ -13,4 +14,5 @@ struct jpeg {
 };
 
 void read_jpeg(FILE *in, struct jpeg *jpeg);
+void decode_coefficients(struct coef *coef, uint16_t *quant_table);
 #endif
-Original file line number
+Diff line change
@@ -1,6 +1,7 @@
     *.o
     *.i
     *.s
+    *.d
     *.png
     *.jpg
@@ Expand Down @@