LCOV - code coverage report
Current view: top level - src/include/utils - ascii.h (source / functions) Hit Total Coverage
Test: PostgreSQL 18devel Lines: 11 11 100.0 %
Date: 2025-01-18 04:15:08 Functions: 1 1 100.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /*-----------------------------------------------------------------------
       2             :  * ascii.h
       3             :  *
       4             :  *   Portions Copyright (c) 1999-2025, PostgreSQL Global Development Group
       5             :  *
       6             :  * src/include/utils/ascii.h
       7             :  *
       8             :  *-----------------------------------------------------------------------
       9             :  */
      10             : 
      11             : #ifndef _ASCII_H_
      12             : #define _ASCII_H_
      13             : 
      14             : #include "port/simd.h"
      15             : 
      16             : extern void ascii_safe_strlcpy(char *dest, const char *src, size_t destsiz);
      17             : 
      18             : /*
      19             :  * Verify a chunk of bytes for valid ASCII.
      20             :  *
      21             :  * Returns false if the input contains any zero bytes or bytes with the
      22             :  * high-bit set. Input len must be a multiple of the chunk size (8 or 16).
      23             :  */
      24             : static inline bool
      25     3091980 : is_valid_ascii(const unsigned char *s, int len)
      26             : {
      27     3091980 :     const unsigned char *const s_end = s + len;
      28             :     Vector8     chunk;
      29     3091980 :     Vector8     highbit_cum = vector8_broadcast(0);
      30             : #ifdef USE_NO_SIMD
      31             :     Vector8     zero_cum = vector8_broadcast(0x80);
      32             : #endif
      33             : 
      34             :     Assert(len % sizeof(chunk) == 0);
      35             : 
      36     9275940 :     while (s < s_end)
      37             :     {
      38     6183960 :         vector8_load(&chunk, s);
      39             : 
      40             :         /* Capture any zero bytes in this chunk. */
      41             : #ifdef USE_NO_SIMD
      42             : 
      43             :         /*
      44             :          * First, add 0x7f to each byte. This sets the high bit in each byte,
      45             :          * unless it was a zero. If any resulting high bits are zero, the
      46             :          * corresponding high bits in the zero accumulator will be cleared.
      47             :          *
      48             :          * If none of the bytes in the chunk had the high bit set, the max
      49             :          * value each byte can have after the addition is 0x7f + 0x7f = 0xfe,
      50             :          * and we don't need to worry about carrying over to the next byte. If
      51             :          * any input bytes did have the high bit set, it doesn't matter
      52             :          * because we check for those separately.
      53             :          */
      54             :         zero_cum &= (chunk + vector8_broadcast(0x7F));
      55             : #else
      56             : 
      57             :         /*
      58             :          * Set all bits in each lane of the highbit accumulator where input
      59             :          * bytes are zero.
      60             :          */
      61     6183960 :         highbit_cum = vector8_or(highbit_cum,
      62             :                                  vector8_eq(chunk, vector8_broadcast(0)));
      63             : #endif
      64             : 
      65             :         /* Capture all set bits in this chunk. */
      66     6183960 :         highbit_cum = vector8_or(highbit_cum, chunk);
      67             : 
      68     6183960 :         s += sizeof(chunk);
      69             :     }
      70             : 
      71             :     /* Check if any high bits in the high bit accumulator got set. */
      72     3091980 :     if (vector8_is_highbit_set(highbit_cum))
      73        1074 :         return false;
      74             : 
      75             : #ifdef USE_NO_SIMD
      76             :     /* Check if any high bits in the zero accumulator got cleared. */
      77             :     if (zero_cum != vector8_broadcast(0x80))
      78             :         return false;
      79             : #endif
      80             : 
      81     3090906 :     return true;
      82             : }
      83             : 
      84             : #endif                          /* _ASCII_H_ */

Generated by: LCOV version 1.14