summaryrefslogtreecommitdiff
path: root/firmware/asm/memset16.c
blob: 7e31df0cddee8946915339380dd32642ac660263 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
/***************************************************************************
 *             __________               __   ___.
 *   Open      \______   \ ____   ____ |  | _\_ |__   _______  ___
 *   Source     |       _//  _ \_/ ___\|  |/ /| __ \ /  _ \  \/  /
 *   Jukebox    |    |   (  <_> )  \___|    < | \_\ (  <_> > <  <
 *   Firmware   |____|_  /\____/ \___  >__|_ \|___  /\____/__/\_ \
 *                     \/            \/     \/    \/            \/
 * $Id$
 *
 * Copyright (C) 2006 by Jens Arnold
 *
 * This program is free software; you can redistribute it and/or
 * modify it under the terms of the GNU General Public License
 * as published by the Free Software Foundation; either version 2
 * of the License, or (at your option) any later version.
 *
 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
 * KIND, either express or implied.
 *
 ****************************************************************************/

#include "string-extra.h" /* memset16() */

/* Number of 2-byte elements that fit in one long. */
#define LBLOCKSIZE (sizeof(long)/2)
/* Non-zero when address X is not a multiple of sizeof(long). */
#define UNALIGNED(X)   ((long)(X) & (sizeof(long) - 1))
/* True when LEN elements do not fill even a single long. */
#define TOO_SMALL(LEN) ((LEN) < LBLOCKSIZE)

/*
 * Fill a buffer of 16-bit elements with a constant value.
 *
 * dst - start of the destination; it is written through an
 *       unsigned short pointer (and through an unsigned long pointer
 *       when it is long-aligned and len is large enough)
 * val - fill value; only its low 16 bits are stored
 * len - number of 16-bit elements to write (not a byte count)
 *
 * NOTE(review): the word-wide stores alias memory that callers read as
 * 16-bit data; confirm the build does not rely on strict aliasing here.
 */
void memset16(void *dst, int val, size_t len)
{
#if defined(PREFER_SIZE_OVER_SPEED) || defined(__OPTIMIZE_SIZE__)
    /* Compact variant: one 16-bit store per element. */
    unsigned short *p = (unsigned short *)dst;

    while (len--)
    {
        *p++ = val;
    }
#else
    unsigned short *p = (unsigned short *)dst;

    /* Word-wide fast path, only taken when dst is already long-aligned
     * and at least one whole long will be written. */
    if (!TOO_SMALL(len) && !UNALIGNED(dst))
    {
        unsigned long *aligned_addr = (unsigned long *)dst;
        /* Work in unsigned long: shifting a signed int holding a value
         * >= 0x8000 left by 16 would overflow (undefined behaviour). */
        const unsigned long halfword = (unsigned long)val & 0xffffUL;
        unsigned long buffer = 0;
        size_t i;

        /* Replicate the 16-bit value into every halfword of a long. */
        for (i = 0; i < LBLOCKSIZE; i++)
        {
            buffer = (buffer << 16) | halfword;
        }

        /* Main loop: four longs per iteration. */
        while (len >= LBLOCKSIZE*4)
        {
            *aligned_addr++ = buffer;
            *aligned_addr++ = buffer;
            *aligned_addr++ = buffer;
            *aligned_addr++ = buffer;
            len -= 4*LBLOCKSIZE;
        }

        /* Remaining whole longs, one at a time. */
        while (len >= LBLOCKSIZE)
        {
            *aligned_addr++ = buffer;
            len -= LBLOCKSIZE;
        }

        /* Continue with 16-bit stores right after the last long. */
        p = (unsigned short *)aligned_addr;
    }

    /* Trailing elements, or the whole buffer if the fast path was
     * skipped; the assignment truncates val to unsigned short. */
    while (len--)
    {
        *p++ = val;
    }
#endif /* not PREFER_SIZE_OVER_SPEED */
}