+
+ Phase *phase = new Phase;
+ phase->glsl_program_num = glsl_program_num;
+ phase->input_needs_mipmaps = input_needs_mipmaps;
+ phase->inputs = true_inputs;
+ phase->effects = effects;
+
+ return phase;
+}
+
+// Construct GLSL programs, starting at the given effect and following
+// the chain from there. We end a program every time we come to an effect
+// marked as "needs texture bounce", one that is used by multiple other
+// effects, every time an effect wants to change the output size,
+// and of course at the end.
+//
+// We follow a quite simple depth-first search from the output, although
+// without any explicit recursion.
+void EffectChain::construct_glsl_programs(Node *output)
+{
+ // Which effects have already been completed in this phase?
+ // We need to keep track of it, as an effect with multiple outputs
+ // could otherwise be calculate multiple times.
+ std::set<Node *> completed_effects;
+
+ // Effects in the current phase, as well as inputs (outputs from other phases
+ // that we depend on). Note that since we start iterating from the end,
+ // the effect list will be in the reverse order.
+ std::vector<Node *> this_phase_inputs;
+ std::vector<Node *> this_phase_effects;
+
+ // Effects that we have yet to calculate, but that we know should
+ // be in the current phase.
+ std::stack<Node *> effects_todo_this_phase;
+
+ // Effects that we have yet to calculate, but that come from other phases.
+ // We delay these until we have this phase done in its entirety,
+ // at which point we pick any of them and start a new phase from that.
+ std::stack<Node *> effects_todo_other_phases;
+
+ effects_todo_this_phase.push(output);
+
+ for ( ;; ) { // Termination condition within loop.
+ if (!effects_todo_this_phase.empty()) {
+ // OK, we have more to do this phase.
+ Node *node = effects_todo_this_phase.top();
+ effects_todo_this_phase.pop();
+
+ // This should currently only happen for effects that are phase outputs,
+ // and we throw those out separately below.
+ assert(completed_effects.count(node) == 0);
+
+ this_phase_effects.push_back(node);
+ completed_effects.insert(node);
+
+ // Find all the dependencies of this effect, and add them to the stack.
+ std::vector<Node *> deps = node->incoming_links;
+ assert(node->effect->num_inputs() == deps.size());
+ for (unsigned i = 0; i < deps.size(); ++i) {
+ bool start_new_phase = false;
+
+ // FIXME: If we sample directly from a texture, we won't need this.
+ if (node->effect->needs_texture_bounce()) {
+ start_new_phase = true;
+ }
+
+ if (deps[i]->outgoing_links.size() > 1 && deps[i]->effect->num_inputs() > 0) {
+ // More than one effect uses this as the input,
+ // and it is not a texture itself.
+ // The easiest thing to do (and probably also the safest
+ // performance-wise in most cases) is to bounce it to a texture
+ // and then let the next passes read from that.
+ start_new_phase = true;
+ }
+
+ if (deps[i]->effect->changes_output_size()) {
+ start_new_phase = true;
+ }
+
+ if (start_new_phase) {
+ effects_todo_other_phases.push(deps[i]);
+ this_phase_inputs.push_back(deps[i]);
+ } else {
+ effects_todo_this_phase.push(deps[i]);
+ }
+ }
+ continue;
+ }
+
+ // No more effects to do this phase. Take all the ones we have,
+ // and create a GLSL program for it.
+ if (!this_phase_effects.empty()) {
+ reverse(this_phase_effects.begin(), this_phase_effects.end());
+ phases.push_back(compile_glsl_program(this_phase_inputs, this_phase_effects));
+ this_phase_effects.back()->phase = phases.back();
+ this_phase_inputs.clear();
+ this_phase_effects.clear();
+ }
+ assert(this_phase_inputs.empty());
+ assert(this_phase_effects.empty());
+
+ // If we have no effects left, exit.
+ if (effects_todo_other_phases.empty()) {
+ break;
+ }
+
+ Node *node = effects_todo_other_phases.top();
+ effects_todo_other_phases.pop();
+
+ if (completed_effects.count(node) == 0) {
+ // Start a new phase, calculating from this effect.
+ effects_todo_this_phase.push(node);
+ }
+ }
+
+ // Finally, since the phases are found from the output but must be executed
+ // from the input(s), reverse them, too.
+ std::reverse(phases.begin(), phases.end());
+}
+
+void EffectChain::output_dot(const char *filename)
+{
+ FILE *fp = fopen(filename, "w");
+ if (fp == NULL) {
+ perror(filename);
+ exit(1);
+ }
+
+ fprintf(fp, "digraph G {\n");
+ for (unsigned i = 0; i < nodes.size(); ++i) {
+ fprintf(fp, " n%ld [label=\"%s\"];\n", (long)nodes[i], nodes[i]->effect->effect_type_id().c_str());
+ for (unsigned j = 0; j < nodes[i]->outgoing_links.size(); ++j) {
+ std::vector<std::string> labels;
+
+ if (nodes[i]->outgoing_links[j]->effect->needs_texture_bounce()) {
+ labels.push_back("needs_bounce");
+ }
+ if (nodes[i]->effect->changes_output_size()) {
+ labels.push_back("resize");
+ }
+
+ switch (nodes[i]->output_color_space) {
+ case COLORSPACE_REC_709:
+ labels.push_back("spc[rec709]");
+ break;
+ case COLORSPACE_REC_601_525:
+ labels.push_back("spc[rec601-525]");
+ break;
+ case COLORSPACE_REC_601_625:
+ labels.push_back("spc[rec601-625]");
+ break;
+ default:
+ break;
+ }
+
+ switch (nodes[i]->output_gamma_curve) {
+ case GAMMA_sRGB:
+ labels.push_back("gamma[sRGB]");
+ break;
+ case GAMMA_REC_601: // and GAMMA_REC_709
+ labels.push_back("gamma[rec601/709]");
+ break;
+ default:
+ break;
+ }
+
+ if (labels.empty()) {
+ fprintf(fp, " n%ld -> n%ld;\n", (long)nodes[i], (long)nodes[i]->outgoing_links[j]);
+ } else {
+ std::string label = labels[0];
+ for (unsigned k = 1; k < labels.size(); ++k) {
+ label += ", " + labels[k];
+ }
+ fprintf(fp, " n%ld -> n%ld [label=\"%s\"];\n", (long)nodes[i], (long)nodes[i]->outgoing_links[j], label.c_str());
+ }
+ }
+ }
+ fprintf(fp, "}\n");
+
+ fclose(fp);
+}
+
+void EffectChain::find_output_size(Phase *phase)
+{
+ Node *output_node = phase->effects.back();
+
+ // If the last effect explicitly sets an output size,
+ // use that.
+ if (output_node->effect->changes_output_size()) {
+ output_node->effect->get_output_size(&phase->output_width, &phase->output_height);
+ return;
+ }
+
+ // If not, look at the input phases, if any. We select the largest one
+ // (really assuming they all have the same aspect currently), by pixel count.
+ if (!phase->inputs.empty()) {
+ unsigned best_width = 0, best_height = 0;
+ for (unsigned i = 0; i < phase->inputs.size(); ++i) {
+ Node *input = phase->inputs[i];
+ assert(input->phase->output_width != 0);
+ assert(input->phase->output_height != 0);
+ if (input->phase->output_width * input->phase->output_height > best_width * best_height) {
+ best_width = input->phase->output_width;
+ best_height = input->phase->output_height;
+ }
+ }
+ assert(best_width != 0);
+ assert(best_height != 0);
+ phase->output_width = best_width;
+ phase->output_height = best_height;
+ return;
+ }
+
+ // OK, no inputs. Just use the global width/height.
+ // TODO: We probably want to use the texture's size eventually.
+ phase->output_width = width;
+ phase->output_height = height;
+}
+
+void EffectChain::finalize()
+{
+ output_dot("final.dot");
+
+ // Find the output effect. This is, simply, one that has no outgoing links.
+ // If there are multiple ones, the graph is malformed (we do not support
+ // multiple outputs right now).
+ std::vector<Node *> output_nodes;
+ for (unsigned i = 0; i < nodes.size(); ++i) {
+ Node *node = nodes[i];
+ if (node->outgoing_links.empty()) {
+ output_nodes.push_back(node);
+ }
+ }
+ assert(output_nodes.size() == 1);
+ Node *output_node = output_nodes[0];
+
+ // Add normalizers to get the output format right.
+ if (output_node->output_color_space != output_format.color_space) {
+ ColorSpaceConversionEffect *colorspace_conversion = new ColorSpaceConversionEffect();
+ colorspace_conversion->set_int("source_space", output_node->output_color_space);
+ colorspace_conversion->set_int("destination_space", output_format.color_space);
+ std::vector<Effect *> inputs;
+ inputs.push_back(output_node->effect);
+ colorspace_conversion->add_self_to_effect_chain(this, inputs);
+
+ assert(node_map.count(colorspace_conversion) != 0);
+ output_node = node_map[colorspace_conversion];
+ output_node->output_color_space = output_format.color_space;
+ }
+ if (output_node->output_gamma_curve != output_format.gamma_curve) {
+ if (output_node->output_gamma_curve != GAMMA_LINEAR) {
+ output_node = normalize_to_linear_gamma(output_node);
+ }
+ GammaCompressionEffect *gamma_conversion = new GammaCompressionEffect();
+ gamma_conversion->set_int("destination_curve", output_format.gamma_curve);
+ std::vector<Effect *> inputs;
+ inputs.push_back(output_node->effect);
+ gamma_conversion->add_self_to_effect_chain(this, inputs);
+
+ assert(node_map.count(gamma_conversion) != 0);
+ output_node = node_map[gamma_conversion];
+ output_node->output_gamma_curve = output_format.gamma_curve;
+ }
+
+ // Construct all needed GLSL programs, starting at the output.
+ construct_glsl_programs(output_node);
+
+ // If we have more than one phase, we need intermediate render-to-texture.
+ // Construct an FBO, and then as many textures as we need.
+ // We choose the simplest option of having one texture per output,
+ // since otherwise this turns into an (albeit simple)
+ // register allocation problem.
+ if (phases.size() > 1) {
+ glGenFramebuffers(1, &fbo);
+
+ for (unsigned i = 0; i < phases.size() - 1; ++i) {
+ find_output_size(phases[i]);
+
+ Node *output_node = phases[i]->effects.back();
+ glGenTextures(1, &output_node->output_texture);
+ check_error();
+ glBindTexture(GL_TEXTURE_2D, output_node->output_texture);
+ check_error();
+ glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_S, GL_CLAMP_TO_EDGE);
+ check_error();
+ glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_WRAP_T, GL_CLAMP_TO_EDGE);
+ check_error();
+ glTexImage2D(GL_TEXTURE_2D, 0, GL_RGBA16F_ARB, phases[i]->output_width, phases[i]->output_height, 0, GL_RGBA, GL_UNSIGNED_BYTE, NULL);
+ check_error();
+
+ output_node->output_texture_width = phases[i]->output_width;
+ output_node->output_texture_height = phases[i]->output_height;
+ }
+ }
+
+ for (unsigned i = 0; i < inputs.size(); ++i) {
+ inputs[i]->finalize();
+ }
+
+ assert(phases[0]->inputs.empty());
+
+ finalized = true;
+}
+
+void EffectChain::render_to_screen()
+{
+ assert(finalized);
+
+ // Basic state.
+ glDisable(GL_BLEND);
+ check_error();
+ glDisable(GL_DEPTH_TEST);
+ check_error();
+ glDepthMask(GL_FALSE);
+ check_error();
+
+ glMatrixMode(GL_PROJECTION);
+ glLoadIdentity();
+ glOrtho(0.0, 1.0, 0.0, 1.0, 0.0, 1.0);
+
+ glMatrixMode(GL_MODELVIEW);
+ glLoadIdentity();
+
+ if (phases.size() > 1) {
+ glBindFramebuffer(GL_FRAMEBUFFER, fbo);
+ check_error();
+ }
+
+ std::set<Node *> generated_mipmaps;
+
+ for (unsigned phase = 0; phase < phases.size(); ++phase) {
+ // See if the requested output size has changed. If so, we need to recreate
+ // the texture (and before we start setting up inputs).
+ if (phase != phases.size() - 1) {
+ find_output_size(phases[phase]);
+
+ Node *output_node = phases[phase]->effects.back();
+
+ if (output_node->output_texture_width != phases[phase]->output_width ||
+ output_node->output_texture_height != phases[phase]->output_height) {
+ glActiveTexture(GL_TEXTURE0);
+ check_error();
+ glBindTexture(GL_TEXTURE_2D, output_node->output_texture);
+ check_error();
+ glTexImage2D(GL_TEXTURE_2D, 0, GL_RGBA16F_ARB, phases[phase]->output_width, phases[phase]->output_height, 0, GL_RGBA, GL_UNSIGNED_BYTE, NULL);
+ check_error();
+ glBindTexture(GL_TEXTURE_2D, 0);
+ check_error();
+
+ output_node->output_texture_width = phases[phase]->output_width;
+ output_node->output_texture_height = phases[phase]->output_height;
+ }
+ }
+
+ glUseProgram(phases[phase]->glsl_program_num);
+ check_error();
+
+ // Set up RTT inputs for this phase.
+ for (unsigned sampler = 0; sampler < phases[phase]->inputs.size(); ++sampler) {
+ glActiveTexture(GL_TEXTURE0 + sampler);
+ Node *input = phases[phase]->inputs[sampler];
+ glBindTexture(GL_TEXTURE_2D, input->output_texture);
+ check_error();
+ if (phases[phase]->input_needs_mipmaps) {
+ if (generated_mipmaps.count(input) == 0) {
+ glGenerateMipmap(GL_TEXTURE_2D);
+ check_error();
+ generated_mipmaps.insert(input);
+ }
+ glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR_MIPMAP_NEAREST);
+ check_error();
+ } else {
+ glTexParameteri(GL_TEXTURE_2D, GL_TEXTURE_MIN_FILTER, GL_LINEAR);
+ check_error();
+ }
+
+ std::string texture_name = std::string("tex_") + input->effect_id;
+ glUniform1i(glGetUniformLocation(phases[phase]->glsl_program_num, texture_name.c_str()), sampler);
+ check_error();
+ }
+
+ // And now the output.
+ if (phase == phases.size() - 1) {
+ // Last phase goes directly to the screen.
+ glBindFramebuffer(GL_FRAMEBUFFER, 0);
+ check_error();
+ glViewport(0, 0, width, height);
+ } else {
+ Node *output_node = phases[phase]->effects.back();
+ glFramebufferTexture2D(
+ GL_FRAMEBUFFER,
+ GL_COLOR_ATTACHMENT0,
+ GL_TEXTURE_2D,
+ output_node->output_texture,
+ 0);
+ check_error();
+ glViewport(0, 0, phases[phase]->output_width, phases[phase]->output_height);
+ }
+
+ // Give the required parameters to all the effects.
+ unsigned sampler_num = phases[phase]->inputs.size();
+ for (unsigned i = 0; i < phases[phase]->effects.size(); ++i) {
+ Node *node = phases[phase]->effects[i];
+ node->effect->set_gl_state(phases[phase]->glsl_program_num, node->effect_id, &sampler_num);
+ check_error();
+ }
+
+ // Now draw!
+ glBegin(GL_QUADS);
+
+ glTexCoord2f(0.0f, 0.0f);
+ glVertex2f(0.0f, 0.0f);
+
+ glTexCoord2f(1.0f, 0.0f);
+ glVertex2f(1.0f, 0.0f);
+
+ glTexCoord2f(1.0f, 1.0f);
+ glVertex2f(1.0f, 1.0f);
+
+ glTexCoord2f(0.0f, 1.0f);
+ glVertex2f(0.0f, 1.0f);
+
+ glEnd();
+ check_error();
+
+ for (unsigned i = 0; i < phases[phase]->effects.size(); ++i) {
+ Node *node = phases[phase]->effects[i];
+ node->effect->clear_gl_state();
+ }
+ }