git/hex.h

#ifndef HEX_H
#define HEX_H

#include "hash.h"
#include "hex-ll.h"

/*
 * Try to read a hash (for the algorithm specified by algop) in hexadecimal
 * format from the 40 (or whatever length the hash algorithm uses)
 * characters starting at hex.  Write the 20-byte (or the length of
 * the hash) result to oid in binary form.
 * Return 0 on success.  Reading stops if a NUL is encountered in the
 * input, so it is safe to pass this function an arbitrary
 * null-terminated string.
 */
int get_oid_hex_algop(const char *hex, struct object_id *oid, const struct git_hash_algo *algop);

/*
 * Convert a binary hash in "unsigned char []" or an object name in
 * "struct object_id *" to its hex equivalent. The `_r` variants are
 * reentrant: they write the NUL-terminated output to the caller-supplied
 * buffer (`buffer` / `out`), which must be at least `GIT_MAX_HEXSZ + 1`
 * bytes, and return a pointer to that buffer for convenience.
 *
 * The non-`_r` variants return a static buffer, but use a ring of 4
 * buffers, making it safe to make multiple calls for a single statement, like:
 *
 *   printf("%s -> %s", hash_to_hex(one), hash_to_hex(two));
 *   printf("%s -> %s", oid_to_hex(one), oid_to_hex(two));
 *
 * The `_algop` variants take the hash algorithm as an explicit argument.
 */
char *hash_to_hex_algop_r(char *buffer, const unsigned char *hash, const struct git_hash_algo *algop);
char *oid_to_hex_r(char *out, const struct object_id *oid);
char *hash_to_hex_algop(const unsigned char *hash, const struct git_hash_algo *algop);	/* static buffer result! */
char *oid_to_hex(const struct object_id *oid);						/* same static buffer */

/*
 * Parse a hexadecimal object ID (40 characters, or whatever length the hash
 * algorithm given by algo uses) starting from hex, updating the pointer
 * specified by end when parsing stops.  The resulting object ID is
 * stored in oid.  Returns 0 on success.  Parsing will stop on the first NUL or
 * other invalid character.  end is only updated on success; otherwise, it is
 * unmodified.
 */
int parse_oid_hex_algop(const char *hex, struct object_id *oid, const char **end,
			const struct git_hash_algo *algo);

/*
 * These functions work like get_oid_hex and parse_oid_hex, but they will parse
 * a hex value for any algorithm. The algorithm is detected based on the length
 * of the hex input, and the detected algorithm is returned (so, unlike those
 * functions, the return value is not 0 on success). If the input is not a hex
 * object ID in any algorithm, returns GIT_HASH_UNKNOWN.
 */
int get_oid_hex_any(const char *hex, struct object_id *oid);
int parse_oid_hex_any(const char *hex, struct object_id *oid, const char **end);

/*
 * The declarations below implicitly use `the_hash_algo` instead of taking a
 * hash algorithm argument, so they are only made available when
 * USE_THE_REPOSITORY_VARIABLE is defined.
 */
#ifdef USE_THE_REPOSITORY_VARIABLE

/*
 * Like get_oid_hex_algop, but for `the_hash_algo`.  get_hash_hex() stores
 * the binary result in the raw byte buffer `hash` rather than in a
 * "struct object_id".
 */
int get_hash_hex(const char *hex, unsigned char *hash);
int get_oid_hex(const char *hex, struct object_id *oid);

/* Like parse_oid_hex_algop, but uses `the_hash_algo`. */
int parse_oid_hex(const char *hex, struct object_id *oid, const char **end);

/*
 * Same as `hash_to_hex_algop()`, but uses `the_hash_algo`.
 */
char *hash_to_hex(const unsigned char *hash);

#endif /* USE_THE_REPOSITORY_VARIABLE */
#endif /* HEX_H */
hex.h: move some hex-related declarations from cache.h hex.c contains code for hex-related functions, but for some reason these functions were declared in the catch-all cache.h. Move the function declarations into a hex.h header instead. This also allows us to remove includes of cache.h from a few C files. For now, we make cache.h include hex.h, so that it is easier to review the direct changes being made by this patch. In the next patch, we will remove that, and add the necessary direct '#include "hex.h"' in the hundreds of C files that need it. Note that reviewing the header changes in this commit might be simplified via git log --no-walk -p --color-moved $COMMIT -- '*.h'` In particular, it highlights the simple movement of code in .h files rather nicely. Signed-off-by: Elijah Newren <newren@gmail.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2023-02-24 00:09:26 +00:00			`#ifndef HEX_H`
			`#define HEX_H`

hash-ll: merge with "hash.h" The "hash-ll.h" header was introduced via d1cbe1e6d8 (hash-ll.h: split out of hash.h to remove dependency on repository.h, 2023-04-22) to make explicit the split between hash-related functions that rely on the global `the_repository`, and those that don't. This split is no longer necessary now that we have removed the reliance on `the_repository`. Merge "hash-ll.h" back into "hash.h". This causes some code units to not include "repository.h" anymore, which requires us to add some forward declarations. Signed-off-by: Patrick Steinhardt <ps@pks.im> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2024-06-14 06:50:32 +00:00			`#include "hash.h"`
hex-ll: separate out non-hash-algo functions In order to further reduce all-in-one headers, separate out functions in hex.h that do not operate on object hashes into its own file, hex-ll.h, and update the include directives in the .c files that need only such functions accordingly. Signed-off-by: Calvin Wan <calvinwan@google.com> Signed-off-by: Jonathan Tan <jonathantanmy@google.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2023-09-29 21:20:48 +00:00			`#include "hex-ll.h"`
hex.h: move some hex-related declarations from cache.h hex.c contains code for hex-related functions, but for some reason these functions were declared in the catch-all cache.h. Move the function declarations into a hex.h header instead. This also allows us to remove includes of cache.h from a few C files. For now, we make cache.h include hex.h, so that it is easier to review the direct changes being made by this patch. In the next patch, we will remove that, and add the necessary direct '#include "hex.h"' in the hundreds of C files that need it. Note that reviewing the header changes in this commit might be simplified via git log --no-walk -p --color-moved $COMMIT -- '*.h'` In particular, it highlights the simple movement of code in .h files rather nicely. Signed-off-by: Elijah Newren <newren@gmail.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2023-02-24 00:09:26 +00:00
			`/*`
hex: retire get_sha1_hex() The naming convention around get_sha1_hex() and its friends is awkward these days, after "struct object_id" was introduced. There are three public functions around this area: * get_sha1_hex() - use the implied the_hash_algo, fill uchar * * get_oid_hex() - use the implied the_hash_algo, fill oid * * get_oid_hex_algop() - use the passed algop, fill oid * Between the latter two, the "_algop" suffix signals whether the the_hash_algo is used as the implied algorithm or the caller should pass an algorithm explicitly. That is very much understandable and is a good convention. Between the former two, however, the "SHA1" vs "OID" in the names differentiate in what type of variable the result is stored. We could argue that it makes sense to use "SHA1" to mean "flat byte buffer" to honor the historical practice in the days before "struct object_id" was invented, but the natural fourth friend of the above group would take an algop and fill a flat byte buffer, and it would be strange to name it get_sha1_hex_algop(). Do we use the passed in algo, or are we limited to SHA-1 ;-)? In fact, such a function exists, albeit as a private helper function used by the implementation of these functions, and is named a lot more sensibly: get_hash_hex_algop(). Correct the misnomer of get_sha1_hex() and use "hash", instead of "sha1", as "flat byte buffer that stores binary (as opposed to hexadecimal) representation of the hash". The four (2x2) friends now become: * get_hash_hex() - use the implied the_hash_algo, fill uchar * * get_oid_hex() - use the implied the_hash_algo, fill oid * * get_hash_hex_algop() - use the passed algop, fill uchar * * get_oid_hex_algop() - use the passed algop, fill oid * As there are only two remaining calls to get_sha1_hex() in the codebase right now, the blast radius of this change is fairly small. 
Signed-off-by: Junio C Hamano <gitster@pobox.com> 2023-07-24 23:11:03 +00:00			`* Try to read a hash (specified by the_hash_algo) in hexadecimal`
			`* format from the 40 (or whatever length the hash algorithm uses)`
			`* characters starting at hex. Write the 20-byte (or the length of`
			`* the hash) result to hash in binary form.`
hex.h: move some hex-related declarations from cache.h hex.c contains code for hex-related functions, but for some reason these functions were declared in the catch-all cache.h. Move the function declarations into a hex.h header instead. This also allows us to remove includes of cache.h from a few C files. For now, we make cache.h include hex.h, so that it is easier to review the direct changes being made by this patch. In the next patch, we will remove that, and add the necessary direct '#include "hex.h"' in the hundreds of C files that need it. Note that reviewing the header changes in this commit might be simplified via git log --no-walk -p --color-moved $COMMIT -- '*.h'` In particular, it highlights the simple movement of code in .h files rather nicely. Signed-off-by: Elijah Newren <newren@gmail.com> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2023-02-24 00:09:26 +00:00			`* Return 0 on success. Reading stops if a NUL is encountered in the`
			`* input, so it is safe to pass this function an arbitrary`
			`* null-terminated string.`
			`*/`
			`int get_oid_hex_algop(const char *hex, struct object_id *oid, const struct git_hash_algo *algop);`

			`/*`
			`* Convert a binary hash in "unsigned char []" or an object name in`
			* "struct object_id *" to its hex equivalent. The `_r` variant is reentrant,
			* and writes the NUL-terminated output to the buffer `out`, which must be at
			* least `GIT_MAX_HEXSZ + 1` bytes, and returns a pointer to out for
			`* convenience.`
			`*`
			* The non-`_r` variant returns a static buffer, but uses a ring of 4
			`* buffers, making it safe to make multiple calls for a single statement, like:`
			`*`
			`* printf("%s -> %s", hash_to_hex(one), hash_to_hex(two));`
			`* printf("%s -> %s", oid_to_hex(one), oid_to_hex(two));`
			`*/`
			`char *hash_to_hex_algop_r(char *buffer, const unsigned char *hash, const struct git_hash_algo *);`
			`char *oid_to_hex_r(char *out, const struct object_id *oid);`
			`char *hash_to_hex_algop(const unsigned char *hash, const struct git_hash_algo *); /* static buffer result! */`
			`char *oid_to_hex(const struct object_id *oid); /* same static buffer */`

			`/*`
			`* Parse a 40-character hexadecimal object ID starting from hex, updating the`
			`* pointer specified by end when parsing stops. The resulting object ID is`
			`* stored in oid. Returns 0 on success. Parsing will stop on the first NUL or`
			`* other invalid character. end is only updated on success; otherwise, it is`
			`* unmodified.`
			`*/`
			`int parse_oid_hex_algop(const char *hex, struct object_id *oid, const char **end,`
			`const struct git_hash_algo *algo);`

			`/*`
			`* These functions work like get_oid_hex and parse_oid_hex, but they will parse`
			`* a hex value for any algorithm. The algorithm is detected based on the length`
			`* and the algorithm in use is returned. If this is not a hex object ID in any`
			`* algorithm, returns GIT_HASH_UNKNOWN.`
			`*/`
			`int get_oid_hex_any(const char *hex, struct object_id *oid);`
			`int parse_oid_hex_any(const char *hex, struct object_id *oid, const char **end);`

hex: guard declarations with `USE_THE_REPOSITORY_VARIABLE` Guard declarations of functions that implicitly use `the_repository` with `USE_THE_REPOSITORY_VARIABLE` such that callers don't accidentally rely on that global variable. Signed-off-by: Patrick Steinhardt <ps@pks.im> Signed-off-by: Junio C Hamano <gitster@pobox.com> 2024-06-14 06:51:14 +00:00			`#ifdef USE_THE_REPOSITORY_VARIABLE`

			/* Like get_oid_hex_algop, but for `the_hash_algo`. */
			`int get_hash_hex(const char *hex, unsigned char *hash);`
			`int get_oid_hex(const char *hex, struct object_id *oid);`

			/* Like parse_oid_hex_algop, but uses `the_hash_algo`. */
			`int parse_oid_hex(const char *hex, struct object_id *oid, const char **end);`

			`/*`
			* Same as `hash_to_hex_algop()`, but uses `the_hash_algo`.
			`*/`
			`char *hash_to_hex(const unsigned char *hash);`

			`#endif /* USE_THE_REPOSITORY_VARIABLE */`
			`#endif /* HEX_H */`