Home | History | Annotate | Download | only in bionic
      1 /*
      2  * Copyright (C) 2008 The Android Open Source Project
      3  * All rights reserved.
      4  *
      5  * Redistribution and use in source and binary forms, with or without
      6  * modification, are permitted provided that the following conditions
      7  * are met:
      8  *  * Redistributions of source code must retain the above copyright
      9  *    notice, this list of conditions and the following disclaimer.
     10  *  * Redistributions in binary form must reproduce the above copyright
     11  *    notice, this list of conditions and the following disclaimer in
     12  *    the documentation and/or other materials provided with the
     13  *    distribution.
     14  *
     15  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     16  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     17  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
     18  * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
     19  * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
     20  * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
     21  * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS
     22  * OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED
     23  * AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
     24  * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
     25  * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
     26  * SUCH DAMAGE.
     27  */
     28 
     29 #include <string.h>
     30 #include <stdint.h>
     31 
     32 size_t strlen_generic(const char *s)
     33 {
     34     __builtin_prefetch(s);
     35     __builtin_prefetch(s+32);
     36 
     37     union {
     38         const char      *b;
     39         const uint32_t  *w;
     40         uintptr_t       i;
     41     } u;
     42 
     43     // these are some scratch variables for the asm code below
     44     uint32_t v, t;
     45 
     46     // initialize the string length to zero
     47     size_t l = 0;
     48 
     49     // align the pointer to a 32-bit word boundary
     50     u.b = s;
     51     while (u.i & 0x3)  {
     52         if (__builtin_expect(*u.b++ == 0, 0)) {
     53             goto done;
     54         }
     55         l++;
     56     }
     57 
     58     // loop for each word, testing if it contains a zero byte
     59     // if so, exit the loop and update the length.
     60     // We need to process 32 bytes per loop to schedule PLD properly
     61     // and achieve the maximum bus speed.
     62     asm(
     63         "ldr     %[v], [%[s]], #4           \n"
     64         "sub     %[l], %[l], %[s]           \n"
     65         "0:                                 \n"
     66         "pld     [%[s], #64]                \n"
     67         "sub     %[t], %[v], %[mask], lsr #7\n"
     68         "and     %[t], %[t], %[mask]        \n"
     69         "bics    %[t], %[t], %[v]           \n"
     70         "bne     1f                         \n"
     71         "ldr     %[v], [%[s]], #4           \n"
     72 #if !defined(__OPTIMIZE_SIZE__)
     73         "sub     %[t], %[v], %[mask], lsr #7\n"
     74         "and     %[t], %[t], %[mask]        \n"
     75         "bics    %[t], %[t], %[v]           \n"
     76         "bne     1f                         \n"
     77         "ldr     %[v], [%[s]], #4           \n"
     78         "sub     %[t], %[v], %[mask], lsr #7\n"
     79         "and     %[t], %[t], %[mask]        \n"
     80         "bics    %[t], %[t], %[v]           \n"
     81         "bne     1f                         \n"
     82         "ldr     %[v], [%[s]], #4           \n"
     83         "sub     %[t], %[v], %[mask], lsr #7\n"
     84         "and     %[t], %[t], %[mask]        \n"
     85         "bics    %[t], %[t], %[v]           \n"
     86         "bne     1f                         \n"
     87         "ldr     %[v], [%[s]], #4           \n"
     88         "sub     %[t], %[v], %[mask], lsr #7\n"
     89         "and     %[t], %[t], %[mask]        \n"
     90         "bics    %[t], %[t], %[v]           \n"
     91         "bne     1f                         \n"
     92         "ldr     %[v], [%[s]], #4           \n"
     93         "sub     %[t], %[v], %[mask], lsr #7\n"
     94         "and     %[t], %[t], %[mask]        \n"
     95         "bics    %[t], %[t], %[v]           \n"
     96         "bne     1f                         \n"
     97         "ldr     %[v], [%[s]], #4           \n"
     98         "sub     %[t], %[v], %[mask], lsr #7\n"
     99         "and     %[t], %[t], %[mask]        \n"
    100         "bics    %[t], %[t], %[v]           \n"
    101         "bne     1f                         \n"
    102         "ldr     %[v], [%[s]], #4           \n"
    103         "sub     %[t], %[v], %[mask], lsr #7\n"
    104         "and     %[t], %[t], %[mask]        \n"
    105         "bics    %[t], %[t], %[v]           \n"
    106         "bne     1f                         \n"
    107         "ldr     %[v], [%[s]], #4           \n"
    108 #endif
    109         "b       0b                         \n"
    110         "1:                                 \n"
    111         "add     %[l], %[l], %[s]           \n"
    112         "tst     %[v], #0xFF                \n"
    113         "beq     2f                         \n"
    114         "add     %[l], %[l], #1             \n"
    115         "tst     %[v], #0xFF00              \n"
    116         "beq     2f                         \n"
    117         "add     %[l], %[l], #1             \n"
    118         "tst     %[v], #0xFF0000            \n"
    119         "it      ne                         \n"
    120         "addne   %[l], %[l], #1             \n"
    121         "2:                                 \n"
    122         : [l]"=&r"(l), [v]"=&r"(v), [t]"=&r"(t), [s]"=&r"(u.b)
    123         : "%[l]"(l), "%[s]"(u.b), [mask]"r"(0x80808080UL)
    124         : "cc"
    125     );
    126 
    127 done:
    128     return l;
    129 }
    130