123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243 |
- #ifdef HAVE_CONFIG_H
- #include "config.h"
- #endif
- #include "pcre2_internal.h"
- BOOL
- PRIV(is_newline)(PCRE2_SPTR ptr, uint32_t type, PCRE2_SPTR endptr,
- uint32_t *lenptr, BOOL utf)
- {
- uint32_t c;
- #ifdef SUPPORT_UNICODE
- if (utf) { GETCHAR(c, ptr); } else c = *ptr;
- #else
- (void)utf;
- c = *ptr;
- #endif
- if (type == NLTYPE_ANYCRLF) switch(c)
- {
- case CHAR_LF:
- *lenptr = 1;
- return TRUE;
- case CHAR_CR:
- *lenptr = (ptr < endptr - 1 && ptr[1] == CHAR_LF)? 2 : 1;
- return TRUE;
- default:
- return FALSE;
- }
- else switch(c)
- {
- #ifdef EBCDIC
- case CHAR_NEL:
- #endif
- case CHAR_LF:
- case CHAR_VT:
- case CHAR_FF:
- *lenptr = 1;
- return TRUE;
- case CHAR_CR:
- *lenptr = (ptr < endptr - 1 && ptr[1] == CHAR_LF)? 2 : 1;
- return TRUE;
- #ifndef EBCDIC
- #if PCRE2_CODE_UNIT_WIDTH == 8
- case CHAR_NEL:
- *lenptr = utf? 2 : 1;
- return TRUE;
- case 0x2028:
- case 0x2029:
- *lenptr = 3;
- return TRUE;
- #else
- case CHAR_NEL:
- case 0x2028:
- case 0x2029:
- *lenptr = 1;
- return TRUE;
- #endif
- #endif
- default:
- return FALSE;
- }
- }
- BOOL
- PRIV(was_newline)(PCRE2_SPTR ptr, uint32_t type, PCRE2_SPTR startptr,
- uint32_t *lenptr, BOOL utf)
- {
- uint32_t c;
- ptr--;
- #ifdef SUPPORT_UNICODE
- if (utf)
- {
- BACKCHAR(ptr);
- GETCHAR(c, ptr);
- }
- else c = *ptr;
- #else
- (void)utf;
- c = *ptr;
- #endif
- if (type == NLTYPE_ANYCRLF) switch(c)
- {
- case CHAR_LF:
- *lenptr = (ptr > startptr && ptr[-1] == CHAR_CR)? 2 : 1;
- return TRUE;
- case CHAR_CR:
- *lenptr = 1;
- return TRUE;
- default:
- return FALSE;
- }
- else switch(c)
- {
- case CHAR_LF:
- *lenptr = (ptr > startptr && ptr[-1] == CHAR_CR)? 2 : 1;
- return TRUE;
- #ifdef EBCDIC
- case CHAR_NEL:
- #endif
- case CHAR_VT:
- case CHAR_FF:
- case CHAR_CR:
- *lenptr = 1;
- return TRUE;
- #ifndef EBCDIC
- #if PCRE2_CODE_UNIT_WIDTH == 8
- case CHAR_NEL:
- *lenptr = utf? 2 : 1;
- return TRUE;
- case 0x2028:
- case 0x2029:
- *lenptr = 3;
- return TRUE;
- #else
- case CHAR_NEL:
- case 0x2028:
- case 0x2029:
- *lenptr = 1;
- return TRUE;
- #endif
- #endif
- default:
- return FALSE;
- }
- }
|