5 #include "maskengine.h"
13 MaskPackage::MaskPackage()
15 apply_mutex = new Condition(1, "MaskPackage::apply_mutex");
18 MaskPackage::~MaskPackage()
29 MaskUnit::MaskUnit(MaskEngine *engine)
32 this->engine = engine;
43 #define SQR(x) ((x) * (x))
63 void MaskUnit::draw_line_clamped(VFrame *frame,
91 unsigned char **rows = (unsigned char**)frame->get_rows();
93 if(draw_y2 != draw_y1)
95 float slope = ((float)draw_x2 - draw_x1) / ((float)draw_y2 - draw_y1);
96 int w = frame->get_w() - 1;
97 int h = frame->get_h();
99 for(float y = draw_y1; y < draw_y2; y++)
103 int x = (int)((y - draw_y1) * slope + draw_x1);
105 int x_i = CLIP(x, 0, w);
107 if(rows[y_i][x_i] == k)
116 void MaskUnit::blur_strip(float *val_p,
124 float *sp_m = src + size - 1;
126 float *vm = val_m + size - 1;
127 float initial_p = sp_p[0];
128 float initial_m = sp_m[0];
130 //printf("MaskUnit::blur_strip %d\n", size);
131 for(int k = 0; k < size; k++)
133 int terms = (k < 4) ? k : 4;
135 for(l = 0; l <= terms; l++)
137 *vp += n_p[l] * sp_p[-l] - d_p[l] * vp[-l];
138 *vm += n_m[l] * sp_m[l] - d_m[l] * vm[l];
143 *vp += (n_p[l] - bd_p[l]) * initial_p;
144 *vm += (n_m[l] - bd_m[l]) * initial_m;
152 for(int i = 0; i < size; i++)
154 float sum = val_p[i] + val_m[i];
160 void MaskUnit::do_feather(VFrame *output,
166 //printf("MaskUnit::do_feather %f\n", feather);
170 double std_dev = sqrt(-(double)(feather * feather) / (2 * log(1.0 / 255.0)));
171 div = sqrt(2 * M_PI) * std_dev;
172 constants[0] = -1.783 / std_dev;
173 constants[1] = -1.723 / std_dev;
174 constants[2] = 0.6318 / std_dev;
175 constants[3] = 1.997 / std_dev;
176 constants[4] = 1.6803 / div;
177 constants[5] = 3.735 / div;
178 constants[6] = -0.6803 / div;
179 constants[7] = -0.2598 / div;
181 n_p[0] = constants[4] + constants[6];
182 n_p[1] = exp(constants[1]) *
183 (constants[7] * sin(constants[3]) -
184 (constants[6] + 2 * constants[4]) * cos(constants[3])) +
186 (constants[5] * sin(constants[2]) -
187 (2 * constants[6] + constants[4]) * cos(constants[2]));
189 n_p[2] = 2 * exp(constants[0] + constants[1]) *
190 ((constants[4] + constants[6]) * cos(constants[3]) *
191 cos(constants[2]) - constants[5] *
192 cos(constants[3]) * sin(constants[2]) -
193 constants[7] * cos(constants[2]) * sin(constants[3])) +
194 constants[6] * exp(2 * constants[0]) +
195 constants[4] * exp(2 * constants[1]);
197 n_p[3] = exp(constants[1] + 2 * constants[0]) *
198 (constants[7] * sin(constants[3]) -
199 constants[6] * cos(constants[3])) +
200 exp(constants[0] + 2 * constants[1]) *
201 (constants[5] * sin(constants[2]) - constants[4] *
206 d_p[1] = -2 * exp(constants[1]) * cos(constants[3]) -
207 2 * exp(constants[0]) * cos(constants[2]);
209 d_p[2] = 4 * cos(constants[3]) * cos(constants[2]) *
210 exp(constants[0] + constants[1]) +
211 exp(2 * constants[1]) + exp (2 * constants[0]);
213 d_p[3] = -2 * cos(constants[2]) * exp(constants[0] + 2 * constants[1]) -
214 2 * cos(constants[3]) * exp(constants[1] + 2 * constants[0]);
216 d_p[4] = exp(2 * constants[0] + 2 * constants[1]);
218 for(int i = 0; i < 5; i++) d_m[i] = d_p[i];
221 for(int i = 1; i <= 4; i++)
222 n_m[i] = n_p[i] - d_p[i] * n_p[0];
224 double sum_n_p, sum_n_m, sum_d;
230 for(int i = 0; i < 5; i++)
237 a = sum_n_p / (1 + sum_d);
238 b = sum_n_m / (1 + sum_d);
240 for(int i = 0; i < 5; i++)
242 bd_p[i] = d_p[i] * a;
243 bd_m[i] = d_m[i] * b;
267 #define DO_FEATHER(type, max) \
269 int frame_w = input->get_w(); \
270 int frame_h = input->get_h(); \
271 int size = MAX(frame_w, frame_h); \
272 float *src = new float[size]; \
273 float *dst = new float[size]; \
274 float *val_p = new float[size]; \
275 float *val_m = new float[size]; \
276 int start_in = start_out - (int)feather; \
277 int end_in = end_out + (int)feather; \
278 if(start_in < 0) start_in = 0; \
279 if(end_in > frame_h) end_in = frame_h; \
280 int strip_size = end_in - start_in; \
281 type **in_rows = (type**)input->get_rows(); \
282 type **out_rows = (type**)output->get_rows(); \
285 /* printf("DO_FEATHER 1\n"); */ \
286 for(j = 0; j < frame_w; j++) \
288 /* printf("DO_FEATHER 1.1 %d\n", j); */ \
289 bzero(val_p, sizeof(float) * (end_in - start_in)); \
290 bzero(val_m, sizeof(float) * (end_in - start_in)); \
291 for(int l = 0, k = start_in; k < end_in; l++, k++) \
293 src[l] = (float)in_rows[k][j]; \
296 blur_strip(val_p, val_m, dst, src, strip_size, max); \
298 for(int l = start_out - start_in, k = start_out; k < end_out; l++, k++) \
300 out_rows[k][j] = (type)dst[l]; \
304 for(j = start_out; j < end_out; j++) \
306 /* printf("DO_FEATHER 2 %d\n", j); */ \
307 bzero(val_p, sizeof(float) * frame_w); \
308 bzero(val_m, sizeof(float) * frame_w); \
309 for(int k = 0; k < frame_w; k++) \
311 src[k] = (float)out_rows[j][k]; \
314 blur_strip(val_p, val_m, dst, src, frame_w, max); \
316 for(int k = 0; k < frame_w; k++) \
318 out_rows[j][k] = (type)dst[k]; \
322 /* printf("DO_FEATHER 3\n"); */ \
328 /* printf("DO_FEATHER 4\n"); */ \
338 //printf("do_feather %d\n", frame->get_color_model());
339 switch(input->get_color_model())
342 DO_FEATHER(unsigned char, 0xff);
346 DO_FEATHER(uint16_t, 0xffff);
350 DO_FEATHER(float, 1);
359 void MaskUnit::process_package(LoadPackage *package)
361 MaskPackage *ptr = (MaskPackage*)package;
363 if(engine->recalculate && ptr->part == RECALCULATE_PART)
366 if(engine->feather > 0)
367 mask = engine->temp_mask;
371 // Generated oversampling frame
372 int mask_w = mask->get_w();
373 int mask_h = mask->get_h();
374 int oversampled_package_w = mask_w * OVERSAMPLE;
375 int oversampled_package_h = (ptr->row2 - ptr->row1) * OVERSAMPLE;
376 //printf("MaskUnit::process_package 1\n");
379 (temp->get_w() != oversampled_package_w ||
380 temp->get_h() != oversampled_package_h))
385 //printf("MaskUnit::process_package 1\n");
390 oversampled_package_w,
391 oversampled_package_h,
396 //printf("MaskUnit::process_package 1 %d\n", engine->point_sets.total);
399 // Draw oversampled region of polygons on temp
400 for(int k = 0; k < engine->point_sets.total; k++)
403 unsigned char max = k + 1;
404 ArrayList<MaskPoint*> *points = engine->point_sets.values[k];
406 if(points->total < 3) continue;
407 //printf("MaskUnit::process_package 2 %d %d\n", k, points->total);
408 for(int i = 0; i < points->total; i++)
410 MaskPoint *point1 = points->values[i];
411 MaskPoint *point2 = (i >= points->total - 1) ?
413 points->values[i + 1];
416 int segments = (int)(sqrt(SQR(point1->x - point2->x) + SQR(point1->y - point2->y)));
417 float x0 = point1->x;
418 float y0 = point1->y;
419 float x1 = point1->x + point1->control_x2;
420 float y1 = point1->y + point1->control_y2;
421 float x2 = point2->x + point2->control_x1;
422 float y2 = point2->y + point2->control_y1;
423 float x3 = point2->x;
424 float y3 = point2->y;
426 for(int j = 0; j <= segments; j++)
428 float t = (float)j / segments;
430 float tpow3 = t * t * t;
432 float invtpow2 = invt * invt;
433 float invtpow3 = invt * invt * invt;
436 + 3 * t * invtpow2 * x1
437 + 3 * tpow2 * invt * x2
440 + 3 * t * invtpow2 * y1
441 + 3 * tpow2 * invt * y2
450 draw_line_clamped(temp, old_x, old_y, (int)x, (int)y, max);
458 //printf("MaskUnit::process_package 1\n");
464 // Fill in the polygon in the horizontal direction
465 for(int i = 0; i < oversampled_package_h; i++)
467 unsigned char *row = (unsigned char*)temp->get_rows()[i];
471 for(int j = 0; j < oversampled_package_w; j++)
472 if(row[j] == max) total++;
476 if(total & 0x1) total--;
477 for(int j = 0; j < oversampled_package_w; j++)
479 if(row[j] == max && total > 0)
489 if(value) row[j] = value;
502 #define DOWNSAMPLE(type, temp_type, value) \
503 for(int i = 0; i < ptr->row2 - ptr->row1; i++) \
505 type *output_row = (type*)mask->get_rows()[i + ptr->row1]; \
506 unsigned char **input_rows = (unsigned char**)temp->get_rows() + i * OVERSAMPLE; \
509 for(int j = 0; j < mask_w; j++) \
511 temp_type total = 0; \
513 /* Accumulate pixel */ \
514 for(int k = 0; k < OVERSAMPLE; k++) \
516 unsigned char *input_vector = input_rows[k] + j * OVERSAMPLE; \
517 for(int l = 0; l < OVERSAMPLE; l++) \
519 total += (input_vector[l] ? value : 0); \
524 total /= OVERSAMPLE * OVERSAMPLE; \
526 output_row[j] = total; \
531 // Downsample polygon
532 switch(mask->get_color_model())
537 value = (int)((float)engine->value / 100 * 0xff);
538 DOWNSAMPLE(unsigned char, int64_t, value);
545 value = (int)((float)engine->value / 100 * 0xffff);
546 DOWNSAMPLE(uint16_t, int64_t, value);
553 value = (float)engine->value / 100;
554 DOWNSAMPLE(float, double, value);
561 if(ptr->part == RECALCULATE_PART)
563 // The feather could span more than one package so can't do it until
564 // all packages are drawn.
565 if(get_package_number() >= engine->get_total_packages() / 2 - 1)
567 for(int i = engine->get_total_packages() / 2;
568 i < engine->get_total_packages();
571 MaskPackage *package = (MaskPackage*)engine->get_package(i);
572 package->apply_mutex->unlock();
579 if(ptr->part == APPLY_PART)
581 //printf("MaskUnit::process_package 2.1\n");
582 ptr->apply_mutex->lock("MaskUnit::process_package");
583 ptr->apply_mutex->unlock();
584 //printf("MaskUnit::process_package 2.2\n");
586 if(engine->recalculate)
589 if(engine->feather > 0) do_feather(engine->mask,
596 //printf("MaskUnit::process_package 3 %f\n", engine->feather);
602 int mask_w = engine->mask->get_w();
605 #define APPLY_MASK_SUBTRACT_ALPHA(type, max, components, do_yuv) \
607 type *output_row = (type*)engine->output->get_rows()[i]; \
608 type *mask_row = (type*)engine->mask->get_rows()[i]; \
609 int chroma_offset = (int)(max + 1) / 2; \
611 for(int j = 0; j < mask_w; j++) \
613 if(components == 4) \
615 output_row[j * 4 + 3] = output_row[j * 4 + 3] * (max - mask_row[j]) / max; \
619 output_row[j * 3] = output_row[j * 3] * (max - mask_row[j]) / max; \
621 output_row[j * 3 + 1] = output_row[j * 3 + 1] * (max - mask_row[j]) / max; \
622 output_row[j * 3 + 2] = output_row[j * 3 + 2] * (max - mask_row[j]) / max; \
626 output_row[j * 3 + 1] += chroma_offset * mask_row[j] / max; \
627 output_row[j * 3 + 2] += chroma_offset * mask_row[j] / max; \
633 #define APPLY_MASK_MULTIPLY_ALPHA(type, max, components, do_yuv) \
635 type *output_row = (type*)engine->output->get_rows()[i]; \
636 type *mask_row = (type*)engine->mask->get_rows()[i]; \
637 int chroma_offset = (int)(max + 1) / 2; \
639 for(int j = 0; j < mask_w; j++) \
641 if(components == 4) \
643 output_row[j * 4 + 3] = output_row[j * 4 + 3] * mask_row[j] / max; \
647 output_row[j * 3] = output_row[j * 3] * mask_row[j] / max; \
649 output_row[j * 3 + 1] = output_row[j * 3 + 1] * mask_row[j] / max; \
650 output_row[j * 3 + 2] = output_row[j * 3 + 2] * mask_row[j] / max; \
654 output_row[j * 3 + 1] += chroma_offset * (max - mask_row[j]) / max; \
655 output_row[j * 3 + 2] += chroma_offset * (max - mask_row[j]) / max; \
664 //printf("MaskUnit::process_package 1 %d\n", engine->mode);
665 for(int i = ptr->row1; i < ptr->row2; i++)
669 case MASK_MULTIPLY_ALPHA:
670 switch(engine->output->get_color_model())
673 APPLY_MASK_MULTIPLY_ALPHA(unsigned char, 0xff, 3, 0);
676 APPLY_MASK_MULTIPLY_ALPHA(float, 1.0, 3, 0);
679 APPLY_MASK_MULTIPLY_ALPHA(unsigned char, 0xff, 3, 1);
682 APPLY_MASK_MULTIPLY_ALPHA(float, 1.0, 4, 0);
685 APPLY_MASK_MULTIPLY_ALPHA(unsigned char, 0xff, 4, 1);
688 APPLY_MASK_MULTIPLY_ALPHA(unsigned char, 0xff, 4, 0);
691 APPLY_MASK_MULTIPLY_ALPHA(uint16_t, 0xffff, 3, 0);
694 APPLY_MASK_MULTIPLY_ALPHA(uint16_t, 0xffff, 3, 1);
696 case BC_YUVA16161616:
697 APPLY_MASK_MULTIPLY_ALPHA(uint16_t, 0xffff, 4, 1);
699 case BC_RGBA16161616:
700 APPLY_MASK_MULTIPLY_ALPHA(uint16_t, 0xffff, 4, 0);
705 case MASK_SUBTRACT_ALPHA:
706 switch(engine->output->get_color_model())
709 APPLY_MASK_SUBTRACT_ALPHA(unsigned char, 0xff, 3, 0);
712 APPLY_MASK_SUBTRACT_ALPHA(float, 1.0, 3, 0);
715 APPLY_MASK_SUBTRACT_ALPHA(float, 1.0, 4, 0);
718 APPLY_MASK_SUBTRACT_ALPHA(unsigned char, 0xff, 4, 0);
721 APPLY_MASK_SUBTRACT_ALPHA(unsigned char, 0xff, 3, 1);
724 APPLY_MASK_SUBTRACT_ALPHA(unsigned char, 0xff, 4, 1);
727 APPLY_MASK_SUBTRACT_ALPHA(uint16_t, 0xffff, 3, 0);
729 case BC_RGBA16161616:
730 APPLY_MASK_SUBTRACT_ALPHA(uint16_t, 0xffff, 4, 0);
733 APPLY_MASK_SUBTRACT_ALPHA(uint16_t, 0xffff, 3, 1);
735 case BC_YUVA16161616:
736 APPLY_MASK_SUBTRACT_ALPHA(uint16_t, 0xffff, 4, 1);
749 MaskEngine::MaskEngine(int cpus)
750 : LoadServer(cpus, cpus * OVERSAMPLE * 2)
751 // : LoadServer(1, OVERSAMPLE * 2)
756 MaskEngine::~MaskEngine()
763 point_sets.remove_all_objects();
766 int MaskEngine::points_equivalent(ArrayList<MaskPoint*> *new_points,
767 ArrayList<MaskPoint*> *points)
769 //printf("MaskEngine::points_equivalent %d %d\n", new_points->total, points->total);
770 if(new_points->total != points->total) return 0;
772 for(int i = 0; i < new_points->total; i++)
774 if(!(*new_points->values[i] == *points->values[i])) return 0;
780 void MaskEngine::do_mask(VFrame *output,
781 int64_t start_position,
783 double project_frame_rate,
784 MaskAutos *keyframe_set,
787 int64_t start_position_project = (int64_t)(start_position *
791 MaskAuto *default_auto = (MaskAuto*)keyframe_set->default_auto;
792 MaskAuto *keyframe = (MaskAuto*)keyframe_set->get_prev_auto(start_position_project,
797 int total_points = 0;
798 for(int i = 0; i < keyframe->masks.total; i++)
800 SubMask *mask = keyframe->get_submask(i);
801 int submask_points = mask->points.total;
802 if(submask_points > 1) total_points += submask_points;
805 //printf("MaskEngine::do_mask 1 %d %d\n", total_points, keyframe->value);
806 // Ignore certain masks
807 if(total_points < 2 ||
808 (keyframe->value == 0 && default_auto->mode == MASK_SUBTRACT_ALPHA))
813 // Fake certain masks
814 if(keyframe->value == 0 && default_auto->mode == MASK_MULTIPLY_ALPHA)
816 output->clear_frame();
820 //printf("MaskEngine::do_mask 1\n");
822 int new_color_model = 0;
824 switch(output->get_color_model())
828 new_color_model = BC_A_FLOAT;
835 new_color_model = BC_A8;
839 case BC_RGBA16161616:
841 case BC_YUVA16161616:
842 new_color_model = BC_A16;
846 // Determine if recalculation is needed
849 (mask->get_w() != output->get_w() ||
850 mask->get_h() != output->get_h() ||
851 mask->get_color_model() != new_color_model))
861 if(point_sets.total != keyframe_set->total_submasks(start_position_project,
869 i < keyframe_set->total_submasks(start_position_project,
870 direction) && !recalculate;
873 ArrayList<MaskPoint*> *new_points = new ArrayList<MaskPoint*>;
874 keyframe_set->get_points(new_points,
876 start_position_project,
878 if(!points_equivalent(new_points, point_sets.values[i])) recalculate = 1;
879 new_points->remove_all_objects();
884 !EQUIV(keyframe->feather, feather) ||
885 !EQUIV(keyframe->value, value))
894 temp_mask = new VFrame(0,
899 if(keyframe->feather > 0)
900 temp_mask->clear_frame();
903 point_sets.remove_all_objects();
906 i < keyframe_set->total_submasks(start_position_project,
910 ArrayList<MaskPoint*> *new_points = new ArrayList<MaskPoint*>;
911 keyframe_set->get_points(new_points,
913 start_position_project,
915 point_sets.append(new_points);
921 this->output = output;
922 this->mode = default_auto->mode;
923 this->feather = keyframe->feather;
924 this->value = keyframe->value;
933 void MaskEngine::init_packages()
935 //printf("MaskEngine::init_packages 1\n");
936 int division = (int)((float)output->get_h() / (total_packages / 2) + 0.5);
937 if(division < 1) division = 1;
939 // Always a multiple of 2 packages exist
940 for(int i = 0; i < get_total_packages() / 2; i++)
942 MaskPackage *part1 = (MaskPackage*)packages[i];
943 MaskPackage *part2 = (MaskPackage*)packages[i + total_packages / 2];
944 part2->row1 = part1->row1 = division * i;
945 part2->row2 = part1->row2 = division * i + division;
946 part2->row1 = part1->row1 = MIN(output->get_h(), part1->row1);
947 part2->row2 = part1->row2 = MIN(output->get_h(), part1->row2);
949 if(i >= (total_packages / 2) - 1)
951 part2->row2 = part1->row2 = output->get_h();
954 part2->apply_mutex->lock("MaskEngine::init_packages");
956 part1->part = RECALCULATE_PART;
957 part2->part = APPLY_PART;
959 //printf("MaskEngine::init_packages 2\n");
962 LoadClient* MaskEngine::new_client()
964 return new MaskUnit(this);
967 LoadPackage* MaskEngine::new_package()
969 return new MaskPackage;