diff options
Diffstat (limited to 'subversion/libsvn_subr/eol.c')
-rw-r--r-- | subversion/libsvn_subr/eol.c | 108 |
1 files changed, 108 insertions, 0 deletions
diff --git a/subversion/libsvn_subr/eol.c b/subversion/libsvn_subr/eol.c new file mode 100644 index 0000000..88a6a37 --- /dev/null +++ b/subversion/libsvn_subr/eol.c @@ -0,0 +1,108 @@ +/* + * eol.c : generic eol/keyword routines + * + * ==================================================================== + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + * ==================================================================== + */ + + + +#define APR_WANT_STRFUNC + +#include <apr_file_io.h> +#include "svn_io.h" +#include "private/svn_eol_private.h" +#include "private/svn_dep_compat.h" + +/* Machine-word-sized masks used in svn_eol__find_eol_start. + */ +char * +svn_eol__find_eol_start(char *buf, apr_size_t len) +{ +#if !SVN_UNALIGNED_ACCESS_IS_OK + + /* On some systems, we need to make sure that buf is properly aligned + * for chunky data access. This overhead is still justified because + * only lines tend to be tens of chars long. + */ + for (; (len > 0) && ((apr_uintptr_t)buf) & (sizeof(apr_uintptr_t)-1) + ; ++buf, --len) + { + if (*buf == '\n' || *buf == '\r') + return buf; + } + +#endif + + /* Scan the input one machine word at a time. */ + for (; len > sizeof(apr_uintptr_t) + ; buf += sizeof(apr_uintptr_t), len -= sizeof(apr_uintptr_t)) + { + /* This is a variant of the well-known strlen test: */ + apr_uintptr_t chunk = *(const apr_uintptr_t *)buf; + + /* A byte in SVN__R_TEST is \0, iff it was \r in *BUF. + * Similarly, SVN__N_TEST is an indicator for \n. */ + apr_uintptr_t r_test = chunk ^ SVN__R_MASK; + apr_uintptr_t n_test = chunk ^ SVN__N_MASK; + + /* A byte in SVN__R_TEST can by < 0x80, iff it has been \0 before + * (i.e. \r in *BUF). Dito for SVN__N_TEST. */ + r_test |= (r_test & SVN__LOWER_7BITS_SET) + SVN__LOWER_7BITS_SET; + n_test |= (n_test & SVN__LOWER_7BITS_SET) + SVN__LOWER_7BITS_SET; + + /* Check whether at least one of the words contains a byte <0x80 + * (if one is detected, there was a \r or \n in CHUNK). */ + if ((r_test & n_test & SVN__BIT_7_SET) != SVN__BIT_7_SET) + break; + } + + /* The remaining odd bytes will be examined the naive way: */ + for (; len > 0; ++buf, --len) + { + if (*buf == '\n' || *buf == '\r') + return buf; + } + + return NULL; +} + +const char * +svn_eol__detect_eol(char *buf, apr_size_t len, char **eolp) +{ + char *eol; + + eol = svn_eol__find_eol_start(buf, len); + if (eol) + { + if (eolp) + *eolp = eol; + + if (*eol == '\n') + return "\n"; + + /* We found a CR. */ + ++eol; + if (eol == buf + len || *eol != '\n') + return "\r"; + return "\r\n"; + } + + return NULL; +} |