Files
httrack/src/htsencoding.h
Xavier Roche 7e7b06b55a Reword the ethical-use notice in source headers
The old license-header note ("We hereby ask people using this source NOT to
use it in purpose of grabbing emails addresses...") read awkwardly: "in
purpose of", "emails addresses", "on persons", and a one-item bullet list
under an "Important notes:" heading.

Replace it across all source headers, configure/configure.ac, and README with
a single clean sentence, and align the wording everywhere:

  Ethical use: we kindly ask that you NOT use this software to harvest email
  addresses or to collect any other private information about people. Doing so
  would dishonor our work and waste the many hours we have spent on it.

Pure text change, no behavior impact.

Co-Authored-By: Claude Opus 4.8 <noreply@anthropic.com>
Signed-off-by: Xavier Roche <roche@httrack.com>
2026-06-14 18:38:17 +02:00

93 lines
3.4 KiB
C

/* ------------------------------------------------------------ */
/*
HTTrack Website Copier, Offline Browser for Windows and Unix
Copyright (C) 2013 Xavier Roche and other contributors
SPDX-License-Identifier: GPL-3.0-or-later
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see <http://www.gnu.org/licenses/>.
Ethical use: we kindly ask that you NOT use this software to harvest email
addresses or to collect any other private information about people. Doing so
would dishonor our work and waste the many hours we have spent on it.
Please visit our Website: http://www.httrack.com
*/
/* ------------------------------------------------------------ */
/* File: Encoding conversion functions */
/* Author: Xavier Roche */
/* ------------------------------------------------------------ */
#ifndef HTS_ENCODING_DEFH
#define HTS_ENCODING_DEFH
/** Standard includes. **/
#include <stdlib.h>
#include <string.h>
#ifdef _WIN32
#include <windows.h>
#endif
/**
* Flags for hts_unescapeUrlSpecial().
**/
typedef enum unescapeFlags {
/** Do not decode ASCII. **/
UNESCAPE_URL_NO_ASCII = 1
} unescapeFlags;
/**
* Unescape HTML entities (as per HTML 4.0 Specification)
* and replace them in-place by their UTF-8 equivalents.
* Note: source and destination may be the same, and the destination only
* needs to hold as space as the source.
* Returns 0 upon success, -1 upon overflow or error.
**/
extern int hts_unescapeEntities(const char *src,
char *dest, const size_t max);
/**
* Unescape HTML entities (as per HTML 4.0 Specification)
* and replace them in-place by their charset equivalents.
* Note: source and destination may be the same, and the destination only
* needs to hold as space as the source.
* Returns 0 upon success, -1 upon overflow or error.
**/
extern int hts_unescapeEntitiesWithCharset(const char *src,
char *dest, const size_t max,
const char *charset);
/**
* Unescape an URL-encoded string. The implicit charset is UTF-8.
* In case of UTF-8 decoding error inside URL-encoded characters,
* the characters are left undecoded.
* Note: source and destination MUST NOT be the same.
* Returns 0 upon success, -1 upon overflow or error.
**/
extern int hts_unescapeUrl(const char *src, char *dest, const size_t max);
/**
* Unescape an URL-encoded string. The implicit charset is UTF-8.
* In case of UTF-8 decoding error inside URL-encoded characters,
* the characters are left undecoded.
* "flags" is a mask composed of UNESCAPE_URL_XXX constants.
* Note: source and destination MUST NOT be the same.
* Returns 0 upon success, -1 upon overflow or error.
**/
extern int hts_unescapeUrlSpecial(const char *src, char *dest, const size_t max,
const int flags);
#endif