Home | History | Annotate | Download | only in rs
      1 /*
      2  * Copyright (C) 2012 The Android Open Source Project
      3  *
      4  * Licensed under the Apache License, Version 2.0 (the "License");
      5  * you may not use this file except in compliance with the License.
      6  * You may obtain a copy of the License at
      7  *
      8  *      http://www.apache.org/licenses/LICENSE-2.0
      9  *
     10  * Unless required by applicable law or agreed to in writing, software
     11  * distributed under the License is distributed on an "AS IS" BASIS,
     12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     13  * See the License for the specific language governing permissions and
     14  * limitations under the License.
     15  */
     16 
     17 #include "rsScriptGroup.h"
     18 
     19 #include "rsContext.h"
     20 // TODO: Is this header needed here?
     21 #include "rsScriptGroup2.h"
     22 
     23 #include <algorithm>
     24 #include <time.h>
     25 
     26 using namespace android;
     27 using namespace android::renderscript;
     28 
     29 ScriptGroup::ScriptGroup(Context *rsc) : ScriptGroupBase(rsc) {
     30 }
     31 
     32 ScriptGroup::~ScriptGroup() {
     33     if (mRSC->mHal.funcs.scriptgroup.destroy) {
     34         mRSC->mHal.funcs.scriptgroup.destroy(mRSC, this);
     35     }
     36 
     37     for (size_t ct=0; ct < mLinks.size(); ct++) {
     38         delete mLinks[ct];
     39     }
     40 
     41     for (auto input : mInputs) {
     42         input->mAlloc.clear();
     43     }
     44 
     45     for (auto output : mOutputs) {
     46         output->mAlloc.clear();
     47     }
     48 }
     49 
     50 ScriptGroup::IO::IO(const ScriptKernelID *kid) {
     51     mKernel = kid;
     52 }
     53 
     54 ScriptGroup::Node::Node(Script *s) {
     55     mScript = s;
     56     mSeen = false;
     57     mOrder = 0;
     58 }
     59 
     60 ScriptGroup::Node * ScriptGroup::findNode(Script *s) const {
     61     //ALOGE("find %p   %i", s, (int)mNodes.size());
     62     for (size_t ct=0; ct < mNodes.size(); ct++) {
     63         Node *n = mNodes[ct];
     64         for (size_t ct2=0; ct2 < n->mKernels.size(); ct2++) {
     65             if (n->mKernels[ct2]->mScript == s) {
     66                 return n;
     67             }
     68         }
     69     }
     70 
     71     return nullptr;
     72 }
     73 
     74 bool ScriptGroup::calcOrderRecurse(Node *n, int depth) {
     75     n->mSeen = true;
     76     if (n->mOrder < depth) {
     77         n->mOrder = depth;
     78     }
     79     bool ret = true;
     80 
     81     for (size_t ct=0; ct < n->mOutputs.size(); ct++) {
     82         const Link *l = n->mOutputs[ct];
     83         Node *nt = NULL;
     84         if (l->mDstField.get()) {
     85             nt = findNode(l->mDstField->mScript);
     86         } else {
     87             nt = findNode(l->mDstKernel->mScript);
     88         }
     89         if (nt->mSeen) {
     90             return false;
     91         }
     92         ret &= calcOrderRecurse(nt, n->mOrder + 1);
     93     }
     94     return ret;
     95 }
     96 
     97 #if !defined(RS_SERVER) && !defined(RS_COMPATIBILITY_LIB)
     98 static int CompareNodeForSort(ScriptGroup::Node *const* lhs,
     99                               ScriptGroup::Node *const* rhs) {
    100     if (lhs[0]->mOrder > rhs[0]->mOrder) {
    101         return 1;
    102     }
    103     return 0;
    104 }
    105 #else
    106 class NodeCompare {
    107 public:
    108     bool operator() (const ScriptGroup::Node* lhs,
    109                      const ScriptGroup::Node* rhs) {
    110         if (lhs->mOrder > rhs->mOrder) {
    111             return true;
    112         }
    113         return false;
    114     }
    115 };
    116 #endif
    117 
    118 bool ScriptGroup::calcOrder() {
    119     // Make nodes
    120 
    121     for (size_t ct=0; ct < mKernels.size(); ct++) {
    122         const ScriptKernelID *k = mKernels[ct].get();
    123         //ALOGE(" kernel %i, %p  s=%p", (int)ct, k, mKernels[ct]->mScript);
    124         Node *n = findNode(k->mScript);
    125         //ALOGE("    n = %p", n);
    126         if (n == NULL) {
    127             n = new Node(k->mScript);
    128             mNodes.add(n);
    129         }
    130         n->mKernels.add(k);
    131     }
    132 
    133     // add links
    134     //ALOGE("link count %i", (int)mLinks.size());
    135     for (size_t ct=0; ct < mLinks.size(); ct++) {
    136         Link *l = mLinks[ct];
    137         //ALOGE("link  %i %p", (int)ct, l);
    138         Node *n = findNode(l->mSource->mScript);
    139         //ALOGE("link n %p", n);
    140         n->mOutputs.add(l);
    141 
    142         if (l->mDstKernel.get()) {
    143             //ALOGE("l->mDstKernel.get() %p", l->mDstKernel.get());
    144             n = findNode(l->mDstKernel->mScript);
    145             //ALOGE("  n1 %p", n);
    146             n->mInputs.add(l);
    147         } else {
    148             n = findNode(l->mDstField->mScript);
    149             //ALOGE("  n2 %p", n);
    150             n->mInputs.add(l);
    151         }
    152     }
    153 
    154     //ALOGE("node count %i", (int)mNodes.size());
    155     // Order nodes
    156     bool ret = true;
    157     for (size_t ct=0; ct < mNodes.size(); ct++) {
    158         Node *n = mNodes[ct];
    159         if (n->mInputs.size() == 0) {
    160             for (size_t ct2=0; ct2 < mNodes.size(); ct2++) {
    161                 mNodes[ct2]->mSeen = false;
    162             }
    163             ret &= calcOrderRecurse(n, 0);
    164         }
    165     }
    166 
    167     for (size_t ct=0; ct < mKernels.size(); ct++) {
    168         const ScriptKernelID *k = mKernels[ct].get();
    169         const Node *n = findNode(k->mScript);
    170 
    171         if (k->mHasKernelOutput) {
    172             bool found = false;
    173             for (size_t ct2=0; ct2 < n->mOutputs.size(); ct2++) {
    174                 if (n->mOutputs[ct2]->mSource.get() == k) {
    175                     found = true;
    176                     break;
    177                 }
    178             }
    179             if (!found) {
    180                 //ALOGE("add io out %p", k);
    181                 mOutputs.add(new IO(k));
    182             }
    183         }
    184 
    185         if (k->mHasKernelInput) {
    186             bool found = false;
    187             for (size_t ct2=0; ct2 < n->mInputs.size(); ct2++) {
    188                 if (n->mInputs[ct2]->mDstKernel.get() == k) {
    189                     found = true;
    190                     break;
    191                 }
    192             }
    193             if (!found) {
    194                 //ALOGE("add io in %p", k);
    195                 mInputs.add(new IO(k));
    196             }
    197         }
    198     }
    199 
    200     // sort
    201 #if !defined(RS_SERVER) && !defined(RS_COMPATIBILITY_LIB)
    202     mNodes.sort(&CompareNodeForSort);
    203 #else
    204     std::sort(mNodes.begin(), mNodes.end(), NodeCompare());
    205 #endif
    206 
    207     return ret;
    208 }
    209 
    210 ScriptGroup * ScriptGroup::create(Context *rsc,
    211                            ScriptKernelID ** kernels, size_t kernelsSize,
    212                            ScriptKernelID ** src, size_t srcSize,
    213                            ScriptKernelID ** dstK, size_t dstKSize,
    214                            ScriptFieldID  ** dstF, size_t dstFSize,
    215                            const Type ** type, size_t typeSize) {
    216 
    217     size_t kernelCount = kernelsSize / sizeof(ScriptKernelID *);
    218     size_t linkCount = typeSize / sizeof(Type *);
    219 
    220     //ALOGE("ScriptGroup::create kernels=%i  links=%i", (int)kernelCount, (int)linkCount);
    221 
    222 
    223     // Start by counting unique kernel sources
    224 
    225     ScriptGroup *sg = new ScriptGroup(rsc);
    226 
    227     sg->mKernels.reserve(kernelCount);
    228     for (size_t ct=0; ct < kernelCount; ct++) {
    229         sg->mKernels.add(kernels[ct]);
    230     }
    231 
    232     sg->mLinks.reserve(linkCount);
    233     for (size_t ct=0; ct < linkCount; ct++) {
    234         Link *l = new Link();
    235         l->mType = type[ct];
    236         l->mSource = src[ct];
    237         l->mDstField = dstF[ct];
    238         l->mDstKernel = dstK[ct];
    239         sg->mLinks.add(l);
    240     }
    241 
    242     sg->calcOrder();
    243 
    244     // allocate links
    245     for (size_t ct=0; ct < sg->mNodes.size(); ct++) {
    246         const Node *n = sg->mNodes[ct];
    247         for (size_t ct2=0; ct2 < n->mOutputs.size(); ct2++) {
    248             Link *l = n->mOutputs[ct2];
    249             if (l->mAlloc.get()) {
    250                 continue;
    251             }
    252             const ScriptKernelID *k = l->mSource.get();
    253 
    254             Allocation * alloc = Allocation::createAllocation(rsc,
    255                     l->mType.get(), RS_ALLOCATION_USAGE_SCRIPT);
    256             l->mAlloc = alloc;
    257 
    258             for (size_t ct3=ct2+1; ct3 < n->mOutputs.size(); ct3++) {
    259                 if (n->mOutputs[ct3]->mSource.get() == l->mSource.get()) {
    260                     n->mOutputs[ct3]->mAlloc = alloc;
    261                 }
    262             }
    263         }
    264     }
    265 
    266     if (rsc->mHal.funcs.scriptgroup.init) {
    267         rsc->mHal.funcs.scriptgroup.init(rsc, sg);
    268     }
    269     sg->incUserRef();
    270     return sg;
    271 }
    272 
    273 void ScriptGroup::setInput(Context *rsc, ScriptKernelID *kid, Allocation *a) {
    274     for (size_t ct=0; ct < mInputs.size(); ct++) {
    275         if (mInputs[ct]->mKernel == kid) {
    276             mInputs[ct]->mAlloc = a;
    277 
    278             if (rsc->mHal.funcs.scriptgroup.setInput) {
    279                 rsc->mHal.funcs.scriptgroup.setInput(rsc, this, kid, a);
    280             }
    281             return;
    282         }
    283     }
    284     rsAssert(!"ScriptGroup:setInput kid not found");
    285 }
    286 
    287 void ScriptGroup::setOutput(Context *rsc, ScriptKernelID *kid, Allocation *a) {
    288     for (size_t ct=0; ct < mOutputs.size(); ct++) {
    289         if (mOutputs[ct]->mKernel == kid) {
    290             mOutputs[ct]->mAlloc = a;
    291 
    292             if (rsc->mHal.funcs.scriptgroup.setOutput) {
    293                 rsc->mHal.funcs.scriptgroup.setOutput(rsc, this, kid, a);
    294             }
    295             return;
    296         }
    297     }
    298     rsAssert(!"ScriptGroup:setOutput kid not found");
    299 }
    300 
    301 bool ScriptGroup::validateInputAndOutput(Context *rsc) {
    302     for(size_t i = 0; i < mInputs.size(); i++) {
    303         if (mInputs[i]->mAlloc.get() == nullptr) {
    304             rsc->setError(RS_ERROR_BAD_VALUE, "ScriptGroup missing input.");
    305             return false;
    306         }
    307     }
    308 
    309     for(size_t i = 0; i < mOutputs.size(); i++) {
    310         if (mOutputs[i]->mAlloc.get() == nullptr) {
    311             rsc->setError(RS_ERROR_BAD_VALUE, "ScriptGroup missing output.");
    312             return false;
    313         }
    314     }
    315 
    316     return true;
    317 }
    318 
    319 void ScriptGroup::execute(Context *rsc) {
    320     if (!validateInputAndOutput(rsc)) {
    321         return;
    322     }
    323 
    324     if (rsc->mHal.funcs.scriptgroup.execute) {
    325         rsc->mHal.funcs.scriptgroup.execute(rsc, this);
    326         return;
    327     }
    328 
    329     for (size_t ct=0; ct < mNodes.size(); ct++) {
    330         Node *n = mNodes[ct];
    331         //ALOGE("node %i, order %i, in %i out %i", (int)ct, n->mOrder, (int)n->mInputs.size(), (int)n->mOutputs.size());
    332 
    333         for (size_t ct2=0; ct2 < n->mKernels.size(); ct2++) {
    334             const ScriptKernelID *k = n->mKernels[ct2];
    335             Allocation *ain = NULL;
    336             Allocation *aout = NULL;
    337 
    338             for (size_t ct3=0; ct3 < n->mInputs.size(); ct3++) {
    339                 if (n->mInputs[ct3]->mDstKernel.get() == k) {
    340                     ain = n->mInputs[ct3]->mAlloc.get();
    341                     //ALOGE(" link in %p", ain);
    342                 }
    343             }
    344             for (size_t ct3=0; ct3 < mInputs.size(); ct3++) {
    345                 if (mInputs[ct3]->mKernel == k) {
    346                     ain = mInputs[ct3]->mAlloc.get();
    347                     //ALOGE(" io in %p", ain);
    348                 }
    349             }
    350 
    351             for (size_t ct3=0; ct3 < n->mOutputs.size(); ct3++) {
    352                 if (n->mOutputs[ct3]->mSource.get() == k) {
    353                     aout = n->mOutputs[ct3]->mAlloc.get();
    354                     //ALOGE(" link out %p", aout);
    355                 }
    356             }
    357             for (size_t ct3=0; ct3 < mOutputs.size(); ct3++) {
    358                 if (mOutputs[ct3]->mKernel == k) {
    359                     aout = mOutputs[ct3]->mAlloc.get();
    360                     //ALOGE(" io out %p", aout);
    361                 }
    362             }
    363 
    364             if (ain == NULL) {
    365                 n->mScript->runForEach(rsc, k->mSlot, NULL, 0, aout, NULL, 0);
    366 
    367             } else {
    368                 const Allocation *ains[1] = {ain};
    369                 n->mScript->runForEach(rsc, k->mSlot, ains,
    370                                        sizeof(ains) / sizeof(RsAllocation),
    371                                        aout, NULL, 0);
    372             }
    373         }
    374 
    375     }
    376 
    377 }
    378 
    379 ScriptGroup::Link::Link() {
    380 }
    381 
    382 ScriptGroup::Link::~Link() {
    383 }
    384 
    385 namespace android {
    386 namespace renderscript {
    387 
    388 
    389 RsScriptGroup rsi_ScriptGroupCreate(Context *rsc,
    390                            RsScriptKernelID * kernels, size_t kernelsSize,
    391                            RsScriptKernelID * src, size_t srcSize,
    392                            RsScriptKernelID * dstK, size_t dstKSize,
    393                            RsScriptFieldID * dstF, size_t dstFSize,
    394                            const RsType * type, size_t typeSize) {
    395 
    396 
    397     return ScriptGroup::create(rsc,
    398                                (ScriptKernelID **) kernels, kernelsSize,
    399                                (ScriptKernelID **) src, srcSize,
    400                                (ScriptKernelID **) dstK, dstKSize,
    401                                (ScriptFieldID  **) dstF, dstFSize,
    402                                (const Type **) type, typeSize);
    403 }
    404 
    405 
    406 void rsi_ScriptGroupSetInput(Context *rsc, RsScriptGroup sg, RsScriptKernelID kid,
    407         RsAllocation alloc) {
    408     //ALOGE("rsi_ScriptGroupSetInput");
    409     ScriptGroup *s = (ScriptGroup *)sg;
    410     s->setInput(rsc, (ScriptKernelID *)kid, (Allocation *)alloc);
    411 }
    412 
    413 void rsi_ScriptGroupSetOutput(Context *rsc, RsScriptGroup sg, RsScriptKernelID kid,
    414         RsAllocation alloc) {
    415     //ALOGE("rsi_ScriptGroupSetOutput");
    416     ScriptGroup *s = (ScriptGroup *)sg;
    417     s->setOutput(rsc, (ScriptKernelID *)kid, (Allocation *)alloc);
    418 }
    419 
    420 void rsi_ScriptGroupExecute(Context *rsc, RsScriptGroup sg) {
    421     ScriptGroupBase *s = (ScriptGroupBase *)sg;
    422     s->execute(rsc);
    423 }
    424 
    425 }
    426 }
    427