The "hash-ll.h" header was introduced via d1cbe1e6d8 (hash-ll.h: split
out of hash.h to remove dependency on repository.h, 2023-04-22) to make
explicit the split between hash-related functions that rely on the
global `the_repository`, and those that don't. This split is no longer
necessary now that we we have removed the reliance on `the_repository`.
Merge "hash-ll.h" back into "hash.h". This causes some code units to not
include "repository.h" anymore, which requires us to add some forward
declarations.
Signed-off-by: Patrick Steinhardt <ps@pks.im>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
		
	
		
			
				
	
	
		
			370 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			370 lines
		
	
	
		
			11 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
#ifndef HASH_H
 | 
						|
#define HASH_H
 | 
						|
 | 
						|
#if defined(SHA1_APPLE)
 | 
						|
#include <CommonCrypto/CommonDigest.h>
 | 
						|
#elif defined(SHA1_OPENSSL)
 | 
						|
#  include <openssl/sha.h>
 | 
						|
#  if defined(OPENSSL_API_LEVEL) && OPENSSL_API_LEVEL >= 3
 | 
						|
#    define SHA1_NEEDS_CLONE_HELPER
 | 
						|
#    include "sha1/openssl.h"
 | 
						|
#  endif
 | 
						|
#elif defined(SHA1_DC)
 | 
						|
#include "sha1dc_git.h"
 | 
						|
#else /* SHA1_BLK */
 | 
						|
#include "block-sha1/sha1.h"
 | 
						|
#endif
 | 
						|
 | 
						|
#if defined(SHA256_NETTLE)
 | 
						|
#include "sha256/nettle.h"
 | 
						|
#elif defined(SHA256_GCRYPT)
 | 
						|
#define SHA256_NEEDS_CLONE_HELPER
 | 
						|
#include "sha256/gcrypt.h"
 | 
						|
#elif defined(SHA256_OPENSSL)
 | 
						|
#  include <openssl/sha.h>
 | 
						|
#  if defined(OPENSSL_API_LEVEL) && OPENSSL_API_LEVEL >= 3
 | 
						|
#    define SHA256_NEEDS_CLONE_HELPER
 | 
						|
#    include "sha256/openssl.h"
 | 
						|
#  endif
 | 
						|
#else
 | 
						|
#include "sha256/block/sha256.h"
 | 
						|
#endif
 | 
						|
 | 
						|
#ifndef platform_SHA_CTX
 | 
						|
/*
 | 
						|
 * platform's underlying implementation of SHA-1; could be OpenSSL,
 | 
						|
 * blk_SHA, Apple CommonCrypto, etc...  Note that the relevant
 | 
						|
 * SHA-1 header may have already defined platform_SHA_CTX for our
 | 
						|
 * own implementations like block-sha1, so we list
 | 
						|
 * the default for OpenSSL compatible SHA-1 implementations here.
 | 
						|
 */
 | 
						|
#define platform_SHA_CTX	SHA_CTX
 | 
						|
#define platform_SHA1_Init	SHA1_Init
 | 
						|
#define platform_SHA1_Update	SHA1_Update
 | 
						|
#define platform_SHA1_Final    	SHA1_Final
 | 
						|
#endif
 | 
						|
 | 
						|
#define git_SHA_CTX		platform_SHA_CTX
 | 
						|
#define git_SHA1_Init		platform_SHA1_Init
 | 
						|
#define git_SHA1_Update		platform_SHA1_Update
 | 
						|
#define git_SHA1_Final		platform_SHA1_Final
 | 
						|
 | 
						|
#ifdef platform_SHA1_Clone
 | 
						|
#define git_SHA1_Clone	platform_SHA1_Clone
 | 
						|
#endif
 | 
						|
 | 
						|
#ifndef platform_SHA256_CTX
 | 
						|
#define platform_SHA256_CTX	SHA256_CTX
 | 
						|
#define platform_SHA256_Init	SHA256_Init
 | 
						|
#define platform_SHA256_Update	SHA256_Update
 | 
						|
#define platform_SHA256_Final	SHA256_Final
 | 
						|
#endif
 | 
						|
 | 
						|
#define git_SHA256_CTX		platform_SHA256_CTX
 | 
						|
#define git_SHA256_Init		platform_SHA256_Init
 | 
						|
#define git_SHA256_Update	platform_SHA256_Update
 | 
						|
#define git_SHA256_Final	platform_SHA256_Final
 | 
						|
 | 
						|
#ifdef platform_SHA256_Clone
 | 
						|
#define git_SHA256_Clone	platform_SHA256_Clone
 | 
						|
#endif
 | 
						|
 | 
						|
#ifdef SHA1_MAX_BLOCK_SIZE
 | 
						|
#include "compat/sha1-chunked.h"
 | 
						|
#undef git_SHA1_Update
 | 
						|
#define git_SHA1_Update		git_SHA1_Update_Chunked
 | 
						|
#endif
 | 
						|
 | 
						|
#ifndef SHA1_NEEDS_CLONE_HELPER
 | 
						|
static inline void git_SHA1_Clone(git_SHA_CTX *dst, const git_SHA_CTX *src)
 | 
						|
{
 | 
						|
	memcpy(dst, src, sizeof(*dst));
 | 
						|
}
 | 
						|
#endif
 | 
						|
 | 
						|
#ifndef SHA256_NEEDS_CLONE_HELPER
 | 
						|
static inline void git_SHA256_Clone(git_SHA256_CTX *dst, const git_SHA256_CTX *src)
 | 
						|
{
 | 
						|
	memcpy(dst, src, sizeof(*dst));
 | 
						|
}
 | 
						|
#endif
 | 
						|
 | 
						|
/*
 | 
						|
 * Note that these constants are suitable for indexing the hash_algos array and
 | 
						|
 * comparing against each other, but are otherwise arbitrary, so they should not
 | 
						|
 * be exposed to the user or serialized to disk.  To know whether a
 | 
						|
 * git_hash_algo struct points to some usable hash function, test the format_id
 | 
						|
 * field for being non-zero.  Use the name field for user-visible situations and
 | 
						|
 * the format_id field for fixed-length fields on disk.
 | 
						|
 */
 | 
						|
/* An unknown hash function. */
 | 
						|
#define GIT_HASH_UNKNOWN 0
 | 
						|
/* SHA-1 */
 | 
						|
#define GIT_HASH_SHA1 1
 | 
						|
/* SHA-256  */
 | 
						|
#define GIT_HASH_SHA256 2
 | 
						|
/* Number of algorithms supported (including unknown). */
 | 
						|
#define GIT_HASH_NALGOS (GIT_HASH_SHA256 + 1)
 | 
						|
 | 
						|
/* "sha1", big-endian */
 | 
						|
#define GIT_SHA1_FORMAT_ID 0x73686131
 | 
						|
 | 
						|
/* The length in bytes and in hex digits of an object name (SHA-1 value). */
 | 
						|
#define GIT_SHA1_RAWSZ 20
 | 
						|
#define GIT_SHA1_HEXSZ (2 * GIT_SHA1_RAWSZ)
 | 
						|
/* The block size of SHA-1. */
 | 
						|
#define GIT_SHA1_BLKSZ 64
 | 
						|
 | 
						|
/* "s256", big-endian */
 | 
						|
#define GIT_SHA256_FORMAT_ID 0x73323536
 | 
						|
 | 
						|
/* The length in bytes and in hex digits of an object name (SHA-256 value). */
 | 
						|
#define GIT_SHA256_RAWSZ 32
 | 
						|
#define GIT_SHA256_HEXSZ (2 * GIT_SHA256_RAWSZ)
 | 
						|
/* The block size of SHA-256. */
 | 
						|
#define GIT_SHA256_BLKSZ 64
 | 
						|
 | 
						|
/* The length in byte and in hex digits of the largest possible hash value. */
 | 
						|
#define GIT_MAX_RAWSZ GIT_SHA256_RAWSZ
 | 
						|
#define GIT_MAX_HEXSZ GIT_SHA256_HEXSZ
 | 
						|
/* The largest possible block size for any supported hash. */
 | 
						|
#define GIT_MAX_BLKSZ GIT_SHA256_BLKSZ
 | 
						|
 | 
						|
struct object_id {
 | 
						|
	unsigned char hash[GIT_MAX_RAWSZ];
 | 
						|
	int algo;	/* XXX requires 4-byte alignment */
 | 
						|
};
 | 
						|
 | 
						|
#define GET_OID_QUIETLY           01
 | 
						|
#define GET_OID_COMMIT            02
 | 
						|
#define GET_OID_COMMITTISH        04
 | 
						|
#define GET_OID_TREE             010
 | 
						|
#define GET_OID_TREEISH          020
 | 
						|
#define GET_OID_BLOB             040
 | 
						|
#define GET_OID_FOLLOW_SYMLINKS 0100
 | 
						|
#define GET_OID_RECORD_PATH     0200
 | 
						|
#define GET_OID_ONLY_TO_DIE    04000
 | 
						|
#define GET_OID_REQUIRE_PATH  010000
 | 
						|
#define GET_OID_HASH_ANY      020000
 | 
						|
 | 
						|
#define GET_OID_DISAMBIGUATORS \
 | 
						|
	(GET_OID_COMMIT | GET_OID_COMMITTISH | \
 | 
						|
	GET_OID_TREE | GET_OID_TREEISH | \
 | 
						|
	GET_OID_BLOB)
 | 
						|
 | 
						|
enum get_oid_result {
 | 
						|
	FOUND = 0,
 | 
						|
	MISSING_OBJECT = -1, /* The requested object is missing */
 | 
						|
	SHORT_NAME_AMBIGUOUS = -2,
 | 
						|
	/* The following only apply when symlinks are followed */
 | 
						|
	DANGLING_SYMLINK = -4, /*
 | 
						|
				* The initial symlink is there, but
 | 
						|
				* (transitively) points to a missing
 | 
						|
				* in-tree file
 | 
						|
				*/
 | 
						|
	SYMLINK_LOOP = -5,
 | 
						|
	NOT_DIR = -6, /*
 | 
						|
		       * Somewhere along the symlink chain, a path is
 | 
						|
		       * requested which contains a file as a
 | 
						|
		       * non-final element.
 | 
						|
		       */
 | 
						|
};
 | 
						|
 | 
						|
#ifdef USE_THE_REPOSITORY_VARIABLE
 | 
						|
# include "repository.h"
 | 
						|
# define the_hash_algo the_repository->hash_algo
 | 
						|
#endif
 | 
						|
 | 
						|
/* A suitably aligned type for stack allocations of hash contexts. */
 | 
						|
union git_hash_ctx {
 | 
						|
	git_SHA_CTX sha1;
 | 
						|
	git_SHA256_CTX sha256;
 | 
						|
};
 | 
						|
typedef union git_hash_ctx git_hash_ctx;
 | 
						|
 | 
						|
typedef void (*git_hash_init_fn)(git_hash_ctx *ctx);
 | 
						|
typedef void (*git_hash_clone_fn)(git_hash_ctx *dst, const git_hash_ctx *src);
 | 
						|
typedef void (*git_hash_update_fn)(git_hash_ctx *ctx, const void *in, size_t len);
 | 
						|
typedef void (*git_hash_final_fn)(unsigned char *hash, git_hash_ctx *ctx);
 | 
						|
typedef void (*git_hash_final_oid_fn)(struct object_id *oid, git_hash_ctx *ctx);
 | 
						|
 | 
						|
struct git_hash_algo {
 | 
						|
	/*
 | 
						|
	 * The name of the algorithm, as appears in the config file and in
 | 
						|
	 * messages.
 | 
						|
	 */
 | 
						|
	const char *name;
 | 
						|
 | 
						|
	/* A four-byte version identifier, used in pack indices. */
 | 
						|
	uint32_t format_id;
 | 
						|
 | 
						|
	/* The length of the hash in binary. */
 | 
						|
	size_t rawsz;
 | 
						|
 | 
						|
	/* The length of the hash in hex characters. */
 | 
						|
	size_t hexsz;
 | 
						|
 | 
						|
	/* The block size of the hash. */
 | 
						|
	size_t blksz;
 | 
						|
 | 
						|
	/* The hash initialization function. */
 | 
						|
	git_hash_init_fn init_fn;
 | 
						|
 | 
						|
	/* The hash context cloning function. */
 | 
						|
	git_hash_clone_fn clone_fn;
 | 
						|
 | 
						|
	/* The hash update function. */
 | 
						|
	git_hash_update_fn update_fn;
 | 
						|
 | 
						|
	/* The hash finalization function. */
 | 
						|
	git_hash_final_fn final_fn;
 | 
						|
 | 
						|
	/* The hash finalization function for object IDs. */
 | 
						|
	git_hash_final_oid_fn final_oid_fn;
 | 
						|
 | 
						|
	/* The OID of the empty tree. */
 | 
						|
	const struct object_id *empty_tree;
 | 
						|
 | 
						|
	/* The OID of the empty blob. */
 | 
						|
	const struct object_id *empty_blob;
 | 
						|
 | 
						|
	/* The all-zeros OID. */
 | 
						|
	const struct object_id *null_oid;
 | 
						|
};
 | 
						|
extern const struct git_hash_algo hash_algos[GIT_HASH_NALGOS];
 | 
						|
 | 
						|
/*
 | 
						|
 * Return a GIT_HASH_* constant based on the name.  Returns GIT_HASH_UNKNOWN if
 | 
						|
 * the name doesn't match a known algorithm.
 | 
						|
 */
 | 
						|
int hash_algo_by_name(const char *name);
 | 
						|
/* Identical, except based on the format ID. */
 | 
						|
int hash_algo_by_id(uint32_t format_id);
 | 
						|
/* Identical, except based on the length. */
 | 
						|
int hash_algo_by_length(int len);
 | 
						|
/* Identical, except for a pointer to struct git_hash_algo. */
 | 
						|
static inline int hash_algo_by_ptr(const struct git_hash_algo *p)
 | 
						|
{
 | 
						|
	return p - hash_algos;
 | 
						|
}
 | 
						|
 | 
						|
const struct object_id *null_oid(void);
 | 
						|
 | 
						|
static inline int hashcmp(const unsigned char *sha1, const unsigned char *sha2, const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	/*
 | 
						|
	 * Teach the compiler that there are only two possibilities of hash size
 | 
						|
	 * here, so that it can optimize for this case as much as possible.
 | 
						|
	 */
 | 
						|
	if (algop->rawsz == GIT_MAX_RAWSZ)
 | 
						|
		return memcmp(sha1, sha2, GIT_MAX_RAWSZ);
 | 
						|
	return memcmp(sha1, sha2, GIT_SHA1_RAWSZ);
 | 
						|
}
 | 
						|
 | 
						|
static inline int hasheq(const unsigned char *sha1, const unsigned char *sha2, const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	/*
 | 
						|
	 * We write this here instead of deferring to hashcmp so that the
 | 
						|
	 * compiler can properly inline it and avoid calling memcmp.
 | 
						|
	 */
 | 
						|
	if (algop->rawsz == GIT_MAX_RAWSZ)
 | 
						|
		return !memcmp(sha1, sha2, GIT_MAX_RAWSZ);
 | 
						|
	return !memcmp(sha1, sha2, GIT_SHA1_RAWSZ);
 | 
						|
}
 | 
						|
 | 
						|
static inline void hashcpy(unsigned char *sha_dst, const unsigned char *sha_src,
 | 
						|
			   const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	memcpy(sha_dst, sha_src, algop->rawsz);
 | 
						|
}
 | 
						|
 | 
						|
static inline void hashclr(unsigned char *hash, const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	memset(hash, 0, algop->rawsz);
 | 
						|
}
 | 
						|
 | 
						|
static inline int oidcmp(const struct object_id *oid1, const struct object_id *oid2)
 | 
						|
{
 | 
						|
	return memcmp(oid1->hash, oid2->hash, GIT_MAX_RAWSZ);
 | 
						|
}
 | 
						|
 | 
						|
static inline int oideq(const struct object_id *oid1, const struct object_id *oid2)
 | 
						|
{
 | 
						|
	return !memcmp(oid1->hash, oid2->hash, GIT_MAX_RAWSZ);
 | 
						|
}
 | 
						|
 | 
						|
static inline void oidcpy(struct object_id *dst, const struct object_id *src)
 | 
						|
{
 | 
						|
	memcpy(dst->hash, src->hash, GIT_MAX_RAWSZ);
 | 
						|
	dst->algo = src->algo;
 | 
						|
}
 | 
						|
 | 
						|
static inline void oidread(struct object_id *oid, const unsigned char *hash,
 | 
						|
			   const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	memcpy(oid->hash, hash, algop->rawsz);
 | 
						|
	if (algop->rawsz < GIT_MAX_RAWSZ)
 | 
						|
		memset(oid->hash + algop->rawsz, 0, GIT_MAX_RAWSZ - algop->rawsz);
 | 
						|
	oid->algo = hash_algo_by_ptr(algop);
 | 
						|
}
 | 
						|
 | 
						|
static inline void oidclr(struct object_id *oid,
 | 
						|
			  const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	memset(oid->hash, 0, GIT_MAX_RAWSZ);
 | 
						|
	oid->algo = hash_algo_by_ptr(algop);
 | 
						|
}
 | 
						|
 | 
						|
static inline struct object_id *oiddup(const struct object_id *src)
 | 
						|
{
 | 
						|
	struct object_id *dst = xmalloc(sizeof(struct object_id));
 | 
						|
	oidcpy(dst, src);
 | 
						|
	return dst;
 | 
						|
}
 | 
						|
 | 
						|
static inline void oid_set_algo(struct object_id *oid, const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	oid->algo = hash_algo_by_ptr(algop);
 | 
						|
}
 | 
						|
 | 
						|
/*
 | 
						|
 * Converts a cryptographic hash (e.g. SHA-1) into an int-sized hash code
 | 
						|
 * for use in hash tables. Cryptographic hashes are supposed to have
 | 
						|
 * uniform distribution, so in contrast to `memhash()`, this just copies
 | 
						|
 * the first `sizeof(int)` bytes without shuffling any bits. Note that
 | 
						|
 * the results will be different on big-endian and little-endian
 | 
						|
 * platforms, so they should not be stored or transferred over the net.
 | 
						|
 */
 | 
						|
static inline unsigned int oidhash(const struct object_id *oid)
 | 
						|
{
 | 
						|
	/*
 | 
						|
	 * Equivalent to 'return *(unsigned int *)oid->hash;', but safe on
 | 
						|
	 * platforms that don't support unaligned reads.
 | 
						|
	 */
 | 
						|
	unsigned int hash;
 | 
						|
	memcpy(&hash, oid->hash, sizeof(hash));
 | 
						|
	return hash;
 | 
						|
}
 | 
						|
 | 
						|
static inline int is_null_oid(const struct object_id *oid)
 | 
						|
{
 | 
						|
	static const unsigned char null_hash[GIT_MAX_RAWSZ];
 | 
						|
	return !memcmp(oid->hash, null_hash, GIT_MAX_RAWSZ);
 | 
						|
}
 | 
						|
 | 
						|
const char *empty_tree_oid_hex(const struct git_hash_algo *algop);
 | 
						|
 | 
						|
static inline int is_empty_blob_oid(const struct object_id *oid,
 | 
						|
				    const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	return oideq(oid, algop->empty_blob);
 | 
						|
}
 | 
						|
 | 
						|
static inline int is_empty_tree_oid(const struct object_id *oid,
 | 
						|
				    const struct git_hash_algo *algop)
 | 
						|
{
 | 
						|
	return oideq(oid, algop->empty_tree);
 | 
						|
}
 | 
						|
 | 
						|
#endif
 |