1dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams/*
2dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * Copyright (C) 2012 The Android Open Source Project
3dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams *
4dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * Licensed under the Apache License, Version 2.0 (the "License");
5dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * you may not use this file except in compliance with the License.
6dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * You may obtain a copy of the License at
7dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams *
8dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams *      http://www.apache.org/licenses/LICENSE-2.0
9dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams *
10dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * Unless required by applicable law or agreed to in writing, software
11dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * distributed under the License is distributed on an "AS IS" BASIS,
12dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * See the License for the specific language governing permissions and
14dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams * limitations under the License.
15dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams */
16dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
171ffd86b448d78366190c540f98f8b6d641cdb6cfYang Ni#include "rsScriptGroup.h"
1893d6bc872b7d9fba63abfa7513d56b38d9c3d371Chris Wailes
19dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams#include "rsContext.h"
20b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni// TODO: Is this header needed here?
211ffd86b448d78366190c540f98f8b6d641cdb6cfYang Ni#include "rsScriptGroup2.h"
221ffd86b448d78366190c540f98f8b6d641cdb6cfYang Ni
231ffd86b448d78366190c540f98f8b6d641cdb6cfYang Ni#include <algorithm>
24dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams#include <time.h>
25dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
2611496ac131bb691edf5bdcab3029dceef5c1e4e1Chih-Hung Hsiehnamespace android {
2711496ac131bb691edf5bdcab3029dceef5c1e4e1Chih-Hung Hsiehnamespace renderscript {
28dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
291ffd86b448d78366190c540f98f8b6d641cdb6cfYang NiScriptGroup::ScriptGroup(Context *rsc) : ScriptGroupBase(rsc) {
30dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
31dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
32dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup::~ScriptGroup() {
33dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    if (mRSC->mHal.funcs.scriptgroup.destroy) {
34dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        mRSC->mHal.funcs.scriptgroup.destroy(mRSC, this);
35dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
36dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
37b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mLinks.size(); ct++) {
38b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        delete mLinks[ct];
39dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
4061d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen
4161d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen    for (auto input : mInputs) {
4261d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen        input->mAlloc.clear();
4361d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen    }
4461d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen
4561d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen    for (auto output : mOutputs) {
4661d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen        output->mAlloc.clear();
4761d5ed595d77cd1eedc0c9dbf563214075946121Yong Chen    }
48dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
49dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
50dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup::IO::IO(const ScriptKernelID *kid) {
51dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    mKernel = kid;
52dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
53dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
54dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup::Node::Node(Script *s) {
55dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    mScript = s;
56dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    mSeen = false;
57dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    mOrder = 0;
58dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
59dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
60dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup::Node * ScriptGroup::findNode(Script *s) const {
61b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    //ALOGE("find %p   %i", s, (int)mNodes.size());
62b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mNodes.size(); ct++) {
63b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Node *n = mNodes[ct];
64b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        for (size_t ct2=0; ct2 < n->mKernels.size(); ct2++) {
65b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            if (n->mKernels[ct2]->mScript == s) {
66b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                return n;
67dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
68dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
69dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
7093d6bc872b7d9fba63abfa7513d56b38d9c3d371Chris Wailes
7144bef6fba6244292b751387f3d6c31cca96c28adChris Wailes    return nullptr;
72dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
73dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
74b8353c5943f4038fd7f08db3d958390ce9418798Yang Nibool ScriptGroup::calcOrderRecurse(Node *n, int depth) {
75b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    n->mSeen = true;
76b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    if (n->mOrder < depth) {
77b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        n->mOrder = depth;
78dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
79dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    bool ret = true;
8093d6bc872b7d9fba63abfa7513d56b38d9c3d371Chris Wailes
81b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < n->mOutputs.size(); ct++) {
82b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        const Link *l = n->mOutputs[ct];
83b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Node *nt = NULL;
84b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (l->mDstField.get()) {
85b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            nt = findNode(l->mDstField->mScript);
86dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        } else {
87b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            nt = findNode(l->mDstKernel->mScript);
88dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
89b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (nt->mSeen) {
90dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            return false;
91dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
92b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        ret &= calcOrderRecurse(nt, n->mOrder + 1);
93dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
9493d6bc872b7d9fba63abfa7513d56b38d9c3d371Chris Wailes    return ret;
95dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
96dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
97b8353c5943f4038fd7f08db3d958390ce9418798Yang Niclass NodeCompare {
98b8353c5943f4038fd7f08db3d958390ce9418798Yang Nipublic:
99b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    bool operator() (const ScriptGroup::Node* lhs,
100b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                     const ScriptGroup::Node* rhs) {
10182e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang        return (lhs->mOrder < rhs->mOrder);
102b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    }
103b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni};
104b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni
105dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsbool ScriptGroup::calcOrder() {
106dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    // Make nodes
10793d6bc872b7d9fba63abfa7513d56b38d9c3d371Chris Wailes
108b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mKernels.size(); ct++) {
109b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        const ScriptKernelID *k = mKernels[ct].get();
110b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        //ALOGE(" kernel %i, %p  s=%p", (int)ct, k, mKernels[ct]->mScript);
111b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Node *n = findNode(k->mScript);
112b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        //ALOGE("    n = %p", n);
113b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (n == NULL) {
114b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            n = new Node(k->mScript);
11582e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang            mNodes.push_back(n);
116dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
11782e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang        n->mKernels.push_back(k);
118dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
119dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
120dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    // add links
121b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    //ALOGE("link count %i", (int)mLinks.size());
122b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mLinks.size(); ct++) {
123b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Link *l = mLinks[ct];
124b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        //ALOGE("link  %i %p", (int)ct, l);
125b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Node *n = findNode(l->mSource->mScript);
126b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        //ALOGE("link n %p", n);
12782e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang        n->mOutputs.push_back(l);
128b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni
129b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (l->mDstKernel.get()) {
130b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            //ALOGE("l->mDstKernel.get() %p", l->mDstKernel.get());
131b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            n = findNode(l->mDstKernel->mScript);
132b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            //ALOGE("  n1 %p", n);
13382e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang            n->mInputs.push_back(l);
134dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        } else {
135b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            n = findNode(l->mDstField->mScript);
136b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            //ALOGE("  n2 %p", n);
13782e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang            n->mInputs.push_back(l);
138dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
139dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
140dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
141b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    //ALOGE("node count %i", (int)mNodes.size());
142dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    // Order nodes
143dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    bool ret = true;
144b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mNodes.size(); ct++) {
145b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Node *n = mNodes[ct];
146b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (n->mInputs.size() == 0) {
147b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct2=0; ct2 < mNodes.size(); ct2++) {
148b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                mNodes[ct2]->mSeen = false;
149dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
150b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            ret &= calcOrderRecurse(n, 0);
151dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
152dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
153dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
154b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mKernels.size(); ct++) {
155b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        const ScriptKernelID *k = mKernels[ct].get();
156b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        const Node *n = findNode(k->mScript);
157dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
158b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (k->mHasKernelOutput) {
159dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            bool found = false;
160b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct2=0; ct2 < n->mOutputs.size(); ct2++) {
161b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                if (n->mOutputs[ct2]->mSource.get() == k) {
162dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                    found = true;
163dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                    break;
164dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
165dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
166dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            if (!found) {
167b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                //ALOGE("add io out %p", k);
16882e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang                mOutputs.push_back(new IO(k));
169dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
170dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
171dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
172b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (k->mHasKernelInput) {
173dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            bool found = false;
174b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct2=0; ct2 < n->mInputs.size(); ct2++) {
175b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                if (n->mInputs[ct2]->mDstKernel.get() == k) {
176dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                    found = true;
177dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                    break;
178dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
179dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
180dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            if (!found) {
181b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                //ALOGE("add io in %p", k);
18282e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang                mInputs.push_back(new IO(k));
183dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
184dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
185dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
186dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
18782e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang    // Sort mNodes in the increasing order.
188b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    std::sort(mNodes.begin(), mNodes.end(), NodeCompare());
189dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    return ret;
190dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
191dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
192dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup * ScriptGroup::create(Context *rsc,
193dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           ScriptKernelID ** kernels, size_t kernelsSize,
194dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           ScriptKernelID ** src, size_t srcSize,
195dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           ScriptKernelID ** dstK, size_t dstKSize,
196dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           ScriptFieldID  ** dstF, size_t dstFSize,
197dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           const Type ** type, size_t typeSize) {
198dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
199dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    size_t kernelCount = kernelsSize / sizeof(ScriptKernelID *);
200dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    size_t linkCount = typeSize / sizeof(Type *);
201dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
202dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    //ALOGE("ScriptGroup::create kernels=%i  links=%i", (int)kernelCount, (int)linkCount);
203dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
204dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
205dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    // Start by counting unique kernel sources
206dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
207dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    ScriptGroup *sg = new ScriptGroup(rsc);
208dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
209dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    sg->mKernels.reserve(kernelCount);
210dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    for (size_t ct=0; ct < kernelCount; ct++) {
21182e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang        sg->mKernels.push_back(kernels[ct]);
212dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
213dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
214dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    sg->mLinks.reserve(linkCount);
215dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    for (size_t ct=0; ct < linkCount; ct++) {
216dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        Link *l = new Link();
217dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        l->mType = type[ct];
218dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        l->mSource = src[ct];
219dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        l->mDstField = dstF[ct];
220dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        l->mDstKernel = dstK[ct];
22182e135c4bbe18855d8ed02632bb074f8da0b96e0Miao Wang        sg->mLinks.push_back(l);
222dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
223dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
224dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    sg->calcOrder();
225dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
226dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    // allocate links
227dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    for (size_t ct=0; ct < sg->mNodes.size(); ct++) {
228dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        const Node *n = sg->mNodes[ct];
229dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        for (size_t ct2=0; ct2 < n->mOutputs.size(); ct2++) {
230dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            Link *l = n->mOutputs[ct2];
231dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            if (l->mAlloc.get()) {
232dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                continue;
233dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
234dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            Allocation * alloc = Allocation::createAllocation(rsc,
235dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                    l->mType.get(), RS_ALLOCATION_USAGE_SCRIPT);
236dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            l->mAlloc = alloc;
237dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
238dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            for (size_t ct3=ct2+1; ct3 < n->mOutputs.size(); ct3++) {
239dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                if (n->mOutputs[ct3]->mSource.get() == l->mSource.get()) {
240dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                    n->mOutputs[ct3]->mAlloc = alloc;
241dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
242dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
243dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
244dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
245dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
246dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    if (rsc->mHal.funcs.scriptgroup.init) {
247dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        rsc->mHal.funcs.scriptgroup.init(rsc, sg);
248dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
24961c86951f6a1192fafc536aee613beb6f899064bStephen Hines    sg->incUserRef();
250dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    return sg;
251dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
252dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
253dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsvoid ScriptGroup::setInput(Context *rsc, ScriptKernelID *kid, Allocation *a) {
254b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mInputs.size(); ct++) {
255b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (mInputs[ct]->mKernel == kid) {
256b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            mInputs[ct]->mAlloc = a;
257dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
258dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            if (rsc->mHal.funcs.scriptgroup.setInput) {
259dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                rsc->mHal.funcs.scriptgroup.setInput(rsc, this, kid, a);
260dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
261dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            return;
262dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
263dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
264dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    rsAssert(!"ScriptGroup:setInput kid not found");
265dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
266dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
267dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsvoid ScriptGroup::setOutput(Context *rsc, ScriptKernelID *kid, Allocation *a) {
268b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mOutputs.size(); ct++) {
269b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        if (mOutputs[ct]->mKernel == kid) {
270b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            mOutputs[ct]->mAlloc = a;
271dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
272dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            if (rsc->mHal.funcs.scriptgroup.setOutput) {
273dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                rsc->mHal.funcs.scriptgroup.setOutput(rsc, this, kid, a);
274dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
275dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            return;
276dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
277dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
278dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    rsAssert(!"ScriptGroup:setOutput kid not found");
279dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
280dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
2815f6f16fe612e1c30732becc66205500994889ac9Yang Nibool ScriptGroup::validateInputAndOutput(Context *rsc) {
2825f6f16fe612e1c30732becc66205500994889ac9Yang Ni    for(size_t i = 0; i < mInputs.size(); i++) {
28344bef6fba6244292b751387f3d6c31cca96c28adChris Wailes        if (mInputs[i]->mAlloc.get() == nullptr) {
2845f6f16fe612e1c30732becc66205500994889ac9Yang Ni            rsc->setError(RS_ERROR_BAD_VALUE, "ScriptGroup missing input.");
2855f6f16fe612e1c30732becc66205500994889ac9Yang Ni            return false;
2865f6f16fe612e1c30732becc66205500994889ac9Yang Ni        }
2875f6f16fe612e1c30732becc66205500994889ac9Yang Ni    }
2885f6f16fe612e1c30732becc66205500994889ac9Yang Ni
2895f6f16fe612e1c30732becc66205500994889ac9Yang Ni    for(size_t i = 0; i < mOutputs.size(); i++) {
29044bef6fba6244292b751387f3d6c31cca96c28adChris Wailes        if (mOutputs[i]->mAlloc.get() == nullptr) {
2915f6f16fe612e1c30732becc66205500994889ac9Yang Ni            rsc->setError(RS_ERROR_BAD_VALUE, "ScriptGroup missing output.");
2925f6f16fe612e1c30732becc66205500994889ac9Yang Ni            return false;
2935f6f16fe612e1c30732becc66205500994889ac9Yang Ni        }
2945f6f16fe612e1c30732becc66205500994889ac9Yang Ni    }
2955f6f16fe612e1c30732becc66205500994889ac9Yang Ni
2965f6f16fe612e1c30732becc66205500994889ac9Yang Ni    return true;
2975f6f16fe612e1c30732becc66205500994889ac9Yang Ni}
2985f6f16fe612e1c30732becc66205500994889ac9Yang Ni
299dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsvoid ScriptGroup::execute(Context *rsc) {
3005f6f16fe612e1c30732becc66205500994889ac9Yang Ni    if (!validateInputAndOutput(rsc)) {
3015f6f16fe612e1c30732becc66205500994889ac9Yang Ni        return;
3025f6f16fe612e1c30732becc66205500994889ac9Yang Ni    }
3035f6f16fe612e1c30732becc66205500994889ac9Yang Ni
304dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    if (rsc->mHal.funcs.scriptgroup.execute) {
305dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        rsc->mHal.funcs.scriptgroup.execute(rsc, this);
306dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        return;
307dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
308dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
309b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    for (size_t ct=0; ct < mNodes.size(); ct++) {
310b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        Node *n = mNodes[ct];
311b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        //ALOGE("node %i, order %i, in %i out %i", (int)ct, n->mOrder, (int)n->mInputs.size(), (int)n->mOutputs.size());
312dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
313b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni        for (size_t ct2=0; ct2 < n->mKernels.size(); ct2++) {
314b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            const ScriptKernelID *k = n->mKernels[ct2];
315b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            Allocation *ain = NULL;
316b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            Allocation *aout = NULL;
317b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni
318b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct3=0; ct3 < n->mInputs.size(); ct3++) {
319b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                if (n->mInputs[ct3]->mDstKernel.get() == k) {
320b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    ain = n->mInputs[ct3]->mAlloc.get();
321b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    //ALOGE(" link in %p", ain);
322dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
323dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
324b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct3=0; ct3 < mInputs.size(); ct3++) {
325b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                if (mInputs[ct3]->mKernel == k) {
326b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    ain = mInputs[ct3]->mAlloc.get();
327b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    //ALOGE(" io in %p", ain);
328dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
329dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
330dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
331b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct3=0; ct3 < n->mOutputs.size(); ct3++) {
332b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                if (n->mOutputs[ct3]->mSource.get() == k) {
333b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    aout = n->mOutputs[ct3]->mAlloc.get();
334b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    //ALOGE(" link out %p", aout);
335dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
336dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
337b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            for (size_t ct3=0; ct3 < mOutputs.size(); ct3++) {
338b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                if (mOutputs[ct3]->mKernel == k) {
339b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    aout = mOutputs[ct3]->mAlloc.get();
340b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                    //ALOGE(" io out %p", aout);
341dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                }
342dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams            }
343dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
344b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni            if (ain == NULL) {
345b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                n->mScript->runForEach(rsc, k->mSlot, NULL, 0, aout, NULL, 0);
346b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni
347f37121300217d3b39ab66dd9c8881bcbcad932dfChris Wailes            } else {
348f37121300217d3b39ab66dd9c8881bcbcad932dfChris Wailes                const Allocation *ains[1] = {ain};
349b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                n->mScript->runForEach(rsc, k->mSlot, ains,
350b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                                       sizeof(ains) / sizeof(RsAllocation),
351b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni                                       aout, NULL, 0);
352f37121300217d3b39ab66dd9c8881bcbcad932dfChris Wailes            }
353dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        }
354b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni
355dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    }
356dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
357dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
358dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
359dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup::Link::Link() {
360dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
361dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
362dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsScriptGroup::Link::~Link() {
363dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
364dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
365dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
366dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason SamsRsScriptGroup rsi_ScriptGroupCreate(Context *rsc,
367dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           RsScriptKernelID * kernels, size_t kernelsSize,
368dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           RsScriptKernelID * src, size_t srcSize,
369dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           RsScriptKernelID * dstK, size_t dstKSize,
370dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           RsScriptFieldID * dstF, size_t dstFSize,
371dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                           const RsType * type, size_t typeSize) {
372dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
373dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
374dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    return ScriptGroup::create(rsc,
375dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                               (ScriptKernelID **) kernels, kernelsSize,
376dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                               (ScriptKernelID **) src, srcSize,
377dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                               (ScriptKernelID **) dstK, dstKSize,
378dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                               (ScriptFieldID  **) dstF, dstFSize,
379dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams                               (const Type **) type, typeSize);
380dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
381dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
382dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
383dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsvoid rsi_ScriptGroupSetInput(Context *rsc, RsScriptGroup sg, RsScriptKernelID kid,
384dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        RsAllocation alloc) {
385b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    //ALOGE("rsi_ScriptGroupSetInput");
386dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    ScriptGroup *s = (ScriptGroup *)sg;
387dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    s->setInput(rsc, (ScriptKernelID *)kid, (Allocation *)alloc);
388dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
389dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
390dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsvoid rsi_ScriptGroupSetOutput(Context *rsc, RsScriptGroup sg, RsScriptKernelID kid,
391dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams        RsAllocation alloc) {
392b8353c5943f4038fd7f08db3d958390ce9418798Yang Ni    //ALOGE("rsi_ScriptGroupSetOutput");
393dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    ScriptGroup *s = (ScriptGroup *)sg;
394dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    s->setOutput(rsc, (ScriptKernelID *)kid, (Allocation *)alloc);
395dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
396dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
397dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Samsvoid rsi_ScriptGroupExecute(Context *rsc, RsScriptGroup sg) {
3981ffd86b448d78366190c540f98f8b6d641cdb6cfYang Ni    ScriptGroupBase *s = (ScriptGroupBase *)sg;
399dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams    s->execute(rsc);
400dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams}
401dbe66d6783c1e53cd1572de0ef6ef6fdf6f76f48Jason Sams
40211496ac131bb691edf5bdcab3029dceef5c1e4e1Chih-Hung Hsieh} // namespace renderscript
40311496ac131bb691edf5bdcab3029dceef5c1e4e1Chih-Hung Hsieh} // namespace android
404