pixel/html/fill__help_8h_source.html

 // Copyright (c) Electronic Arts Inc. All rights reserved.


 #ifndef EASTL_INTERNAL_FILL_HELP_H

 #define EASTL_INTERNAL_FILL_HELP_H


 #if defined(EA_PRAGMA_ONCE_SUPPORTED)

     #pragma once

 #endif


 #include <EASTL/internal/config.h>


 #if defined(EA_COMPILER_MICROSOFT) && (defined(EA_PROCESSOR_X86) || defined(EA_PROCESSOR_X86_64))

 #include <intrin.h>

 #endif


 namespace eastl

 {

     // fill

     //

     // We implement some fill helper functions in order to allow us to optimize it

     // where possible.

     //

     template <bool bIsScalar>

     struct fill_imp

     {

         template <typename ForwardIterator, typename T>

         static void do_fill(ForwardIterator first, ForwardIterator last, const T& value)

         {

             // The C++ standard doesn't specify whether we need to create a temporary

             // or not, but all std STL implementations are written like what we have here.

             for(; first != last; ++first)

                 *first = value;

         }

     };


     template <>

     struct fill_imp<true>

     {

         template <typename ForwardIterator, typename T>

         static void do_fill(ForwardIterator first, ForwardIterator last, const T& value)

         {

             typedef typename eastl::iterator_traits<ForwardIterator>::value_type value_type;

             // We create a temp and fill from that because value might alias to the

             // destination range and so the compiler would be forced into generating

             // less efficient code.

             for(const T temp = value; first != last; ++first)

             {

                 EA_UNUSED(temp);

                 *first = static_cast<value_type>(temp);

             }

         }

     };


     template <typename ForwardIterator, typename T>

     inline void fill(ForwardIterator first, ForwardIterator last, const T& value)

     {

         eastl::fill_imp< is_scalar<T>::value >::do_fill(first, last, value);


         // Possibly better implementation, as it will deal with small PODs as well as scalars:

         // bEasyCopy is true if the type has a trivial constructor (e.g. is a POD) and if

         // it is small. Thus any built-in type or any small user-defined struct will qualify.

         //const bool bEasyCopy = eastl::type_and<eastl::has_trivial_constructor<T>::value,

         //                                       eastl::integral_constant<bool, (sizeof(T) <= 16)>::value;

         //eastl::fill_imp<bEasyCopy>::do_fill(first, last, value);


     }


     #if (defined(EA_COMPILER_GNUC) || defined(__clang__)) && (defined(EA_PROCESSOR_X86) || defined(EA_PROCESSOR_X86_64))

         #if defined(EA_PROCESSOR_X86_64)

             template <typename Value>

             inline void fill(uint64_t* first, uint64_t* last, Value c)

             {

                 uintptr_t count = (uintptr_t)(last - first);

                 uint64_t  value = (uint64_t)(c);


                 __asm__ __volatile__ ("cld\n\t"

                                       "rep stosq\n\t"

                                        : "+c" (count), "+D" (first), "=m" (first)

                                        : "a" (value)

                                        : "cc" );

             }


             template <typename Value>

             inline void fill(int64_t* first, int64_t* last, Value c)

             {

                 uintptr_t count = (uintptr_t)(last - first);

                 int64_t   value = (int64_t)(c);


                 __asm__ __volatile__ ("cld\n\t"

                                       "rep stosq\n\t"

                                        : "+c" (count), "+D" (first), "=m" (first)

                                        : "a" (value)

                                        : "cc" );

             }

         #endif


         template <typename Value>

         inline void fill(uint32_t* first, uint32_t* last, Value c)

         {

             uintptr_t count = (uintptr_t)(last - first);

             uint32_t  value = (uint32_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosl\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

         }


         template <typename Value>

         inline void fill(int32_t* first, int32_t* last, Value c)

         {

             uintptr_t count = (uintptr_t)(last - first);

             int32_t   value = (int32_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosl\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

         }


         template <typename Value>

         inline void fill(uint16_t* first, uint16_t* last, Value c)

         {

             uintptr_t count = (uintptr_t)(last - first);

             uint16_t  value = (uint16_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosw\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

         }


         template <typename Value>

         inline void fill(int16_t* first, int16_t* last, Value c)

         {

             uintptr_t count = (uintptr_t)(last - first);

             int16_t   value = (int16_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosw\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

         }


     #elif defined(EA_COMPILER_MICROSOFT) && (defined(EA_PROCESSOR_X86) || defined(EA_PROCESSOR_X86_64))

         #if defined(EA_PROCESSOR_X86_64)

             template <typename Value>

             inline void fill(uint64_t* first, uint64_t* last, Value c)

             {

                 __stosq(first, (uint64_t)c, (size_t)(last - first));

             }


             template <typename Value>

             inline void fill(int64_t* first, int64_t* last, Value c)

             {

                 __stosq((uint64_t*)first, (uint64_t)c, (size_t)(last - first));

             }

         #endif


         template <typename Value>

         inline void fill(uint32_t* first, uint32_t* last, Value c)

         {

             __stosd((unsigned long*)first, (unsigned long)c, (size_t)(last - first));

         }


         template <typename Value>

         inline void fill(int32_t* first, int32_t* last, Value c)

         {

             __stosd((unsigned long*)first, (unsigned long)c, (size_t)(last - first));

         }


         template <typename Value>

         inline void fill(uint16_t* first, uint16_t* last, Value c)

         {

             __stosw(first, (uint16_t)c, (size_t)(last - first));

         }


         template <typename Value>

         inline void fill(int16_t* first, int16_t* last, Value c)

         {

             __stosw((uint16_t*)first, (uint16_t)c, (size_t)(last - first));

         }

     #endif


     inline void fill(char* first, char* last, const char& c) // It's debateable whether we should use 'char& c' or 'char c' here.

     {

         __builtin_memset(first, (unsigned char)c, (size_t)(last - first));

     }


     inline void fill(char* first, char* last, const int c) // This is used for cases like 'fill(first, last, 0)'.

     {

         __builtin_memset(first, (unsigned char)c, (size_t)(last - first));

     }


     inline void fill(unsigned char* first, unsigned char* last, const unsigned char& c)

     {

         __builtin_memset(first, (unsigned char)c, (size_t)(last - first));

     }


     inline void fill(unsigned char* first, unsigned char* last, const int c)

     {

         __builtin_memset(first, (unsigned char)c, (size_t)(last - first));

     }


     inline void fill(signed char* first, signed char* last, const signed char& c)

     {

         __builtin_memset(first, (unsigned char)c, (size_t)(last - first));

     }


     inline void fill(signed char* first, signed char* last, const int c)

     {

         __builtin_memset(first, (unsigned char)c, (size_t)(last - first));

     }


     #if defined(_MSC_VER) || defined(__BORLANDC__) || defined(__ICL) // ICL = Intel compiler

         inline void fill(bool* first, bool* last, const bool& b)

         {

             __builtin_memset(first, (char)b, (size_t)(last - first));

         }

     #endif


     // fill_n

     //

     // We implement some fill helper functions in order to allow us to optimize it

     // where possible.

     //

     template <bool bIsScalar>

     struct fill_n_imp

     {

         template <typename OutputIterator, typename Size, typename T>

         static OutputIterator do_fill(OutputIterator first, Size n, const T& value)

         {

             for(; n-- > 0; ++first)

                 *first = value;

             return first;

         }

     };


     template <>

     struct fill_n_imp<true>

     {

         template <typename OutputIterator, typename Size, typename T>

         static OutputIterator do_fill(OutputIterator first, Size n, const T& value)

         {

             typedef typename eastl::iterator_traits<OutputIterator>::value_type value_type;


             // We create a temp and fill from that because value might alias to

             // the destination range and so the compiler would be forced into

             // generating less efficient code.

             for(const T temp = value; n-- > 0; ++first)

                 *first = static_cast<value_type>(temp);

             return first;

         }

     };


     template <typename OutputIterator, typename Size, typename T>

     OutputIterator fill_n(OutputIterator first, Size n, const T& value)

     {

         return eastl::fill_n_imp<is_scalar<T>::value>::do_fill(first, n, value);

     }


     template <typename Size>

     inline char* fill_n(char* first, Size n, const char& c)

     {

         return (char*)__builtin_memset(first, (char)c, (size_t)n) + n;

     }


     template <typename Size>

     inline unsigned char* fill_n(unsigned char* first, Size n, const unsigned char& c)

     {

         return (unsigned char*)__builtin_memset(first, (unsigned char)c, (size_t)n) + n;

     }


     template <typename Size>

     inline signed char* fill_n(signed char* first, Size n, const signed char& c)

     {

         return (signed char*)__builtin_memset(first, (signed char)c, n) + (size_t)n;

     }


     #if defined(_MSC_VER) || defined(__BORLANDC__) || defined(__ICL) // ICL = Intel compiler

         template <typename Size>

         inline bool* fill_n(bool* first, Size n, const bool& b)

         {

             return (bool*)__builtin_memset(first, (char)b, n) + (size_t)n;

         }

     #endif


     #if (defined(EA_COMPILER_GNUC) || defined(__clang__)) && (defined(EA_PROCESSOR_X86) || defined(EA_PROCESSOR_X86_64))

         #if defined(EA_PROCESSOR_X86_64)

             template <typename Size, typename Value>

             inline uint64_t* fill_n(uint64_t* first, Size n, Value c)

             {

                 uintptr_t count = (uintptr_t)(n);

                 uint64_t  value = (uint64_t)(c);


                 __asm__ __volatile__ ("cld\n\t"

                                       "rep stosq\n\t"

                                        : "+c" (count), "+D" (first), "=m" (first)

                                        : "a" (value)

                                        : "cc" );

                 return first; // first is updated by the code above.

             }


             template <typename Size, typename Value>

             inline int64_t* fill_n(int64_t* first, Size n, Value c)

             {

                 uintptr_t count = (uintptr_t)(n);

                 int64_t   value = (int64_t)(c);


                 __asm__ __volatile__ ("cld\n\t"

                                       "rep stosq\n\t"

                                        : "+c" (count), "+D" (first), "=m" (first)

                                        : "a" (value)

                                        : "cc" );

                 return first; // first is updated by the code above.

             }

         #endif


         template <typename Size, typename Value>

         inline uint32_t* fill_n(uint32_t* first, Size n, Value c)

         {

             uintptr_t count = (uintptr_t)(n);

             uint32_t  value = (uint32_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosl\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

             return first; // first is updated by the code above.

         }


         template <typename Size, typename Value>

         inline int32_t* fill_n(int32_t* first, Size n, Value c)

         {

             uintptr_t count = (uintptr_t)(n);

             int32_t   value = (int32_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosl\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

             return first; // first is updated by the code above.

         }


         template <typename Size, typename Value>

         inline uint16_t* fill_n(uint16_t* first, Size n, Value c)

         {

             uintptr_t count = (uintptr_t)(n);

             uint16_t  value = (uint16_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosw\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

             return first; // first is updated by the code above.

         }


         template <typename Size, typename Value>

         inline int16_t* fill_n(int16_t* first, Size n, Value c)

         {

             uintptr_t count = (uintptr_t)(n);

             int16_t   value = (int16_t)(c);


             __asm__ __volatile__ ("cld\n\t"

                                   "rep stosw\n\t"

                                    : "+c" (count), "+D" (first), "=m" (first)

                                    : "a" (value)

                                    : "cc" );

             return first; // first is updated by the code above.

         }


     #elif defined(EA_COMPILER_MICROSOFT) && (defined(EA_PROCESSOR_X86) || defined(EA_PROCESSOR_X86_64))

         #if defined(EA_PROCESSOR_X86_64)

             template <typename Size, typename Value>

             inline uint64_t* fill_n(uint64_t* first, Size n, Value c)

             {

                 __stosq(first, (uint64_t)c, (size_t)n);

                 return first + n;

             }


             template <typename Size, typename Value>

             inline int64_t* fill_n(int64_t* first, Size n, Value c)

             {

                 __stosq((uint64_t*)first, (uint64_t)c, (size_t)n);

                 return first + n;

             }

         #endif


         template <typename Size, typename Value>

         inline uint32_t* fill_n(uint32_t* first, Size n, Value c)

         {

             __stosd((unsigned long*)first, (unsigned long)c, (size_t)n);

             return first + n;

         }


         template <typename Size, typename Value>

         inline int32_t* fill_n(int32_t* first, Size n, Value c)

         {

             __stosd((unsigned long*)first, (unsigned long)c, (size_t)n);

             return first + n;

         }


         template <typename Size, typename Value>

         inline uint16_t* fill_n(uint16_t* first, Size n, Value c)

         {

             __stosw(first, (uint16_t)c, (size_t)n);

             return first + n;

         }


         template <typename Size, typename Value>

         inline int16_t* fill_n(int16_t* first, Size n, Value c)

         {

             __stosw((uint16_t*)first, (uint16_t)c, (size_t)n);

             return first + n;

         }

     #endif


 } // namespace eastl


 #endif // Header include guard


eastl
EA Standard Template Library.
Definition: algorithm.h:288

eastl::count
eastl::iterator_traits< InputIterator >::difference_type count(InputIterator first, InputIterator last, const T &value)
Definition: algorithm.h:1347

eastl::fill_n
OutputIterator fill_n(OutputIterator first, Size n, const T &value)
Definition: fill_help.h:299

eastl::fill
void fill(ForwardIterator first, ForwardIterator last, const T &value)
Definition: fill_help.h:75

eastl::fill_imp
Definition: fill_help.h:29

eastl::fill_n_imp
Definition: fill_help.h:261