2005-04-08 00:13:13 +02:00
|
|
|
#ifndef CACHE_H
|
|
|
|
#define CACHE_H
|
|
|
|
|
2005-12-05 20:54:29 +01:00
|
|
|
#include "git-compat-util.h"
|
2005-04-08 00:13:13 +02:00
|
|
|
|
2005-04-21 21:33:22 +02:00
|
|
|
#include SHA1_HEADER
|
2005-04-08 00:13:13 +02:00
|
|
|
#include <zlib.h>
|
|
|
|
|
2005-04-30 18:51:03 +02:00
|
|
|
/*
 * Fallback deflateBound() used when ZLIB_VERNUM is below 0x1200
 * (presumably because such zlib versions do not provide it -- confirm
 * against the zlib changelog).
 *
 * The first argument is ignored.  The size argument "s" is expanded
 * three times, so callers must not pass an expression with side effects.
 */
#if ZLIB_VERNUM < 0x1200
#define deflateBound(c,s)  ((s) + (((s) + 7) >> 3) + (((s) + 63) >> 6) + 11)
#endif
|
|
|
|
|
2006-02-26 16:13:46 +01:00
|
|
|
/*
 * DTYPE(de) reads the d_type member of a directory entry when the
 * platform defines DT_UNKNOWN and NO_D_TYPE_IN_DIRENT is not set.
 *
 * Otherwise any existing DT_* definitions are dropped, replaced with
 * local values, and DTYPE() ignores its argument and always yields
 * DT_UNKNOWN.
 */
#if defined(DT_UNKNOWN) && !defined(NO_D_TYPE_IN_DIRENT)
#define DTYPE(de)	((de)->d_type)
#else
#undef DT_UNKNOWN
#undef DT_DIR
#undef DT_REG
#undef DT_LNK
#define DT_UNKNOWN	0
#define DT_DIR		1
#define DT_REG		2
#define DT_LNK		3
#define DTYPE(de)	DT_UNKNOWN
#endif
|
|
|
|
|
2005-07-14 03:46:20 +02:00
|
|
|
/*
|
|
|
|
* Intensive research over the course of many years has shown that
|
|
|
|
* port 9418 is totally unused by anything else. Or
|
|
|
|
*
|
|
|
|
* Your search - "port 9418" - did not match any documents.
|
|
|
|
*
|
|
|
|
* as www.google.com puts it.
|
2005-09-12 20:23:00 +02:00
|
|
|
*
|
|
|
|
* This port has been properly assigned for git use by IANA:
|
|
|
|
* git (Assigned-9418) [I06-050728-0001].
|
|
|
|
*
|
|
|
|
* git 9418/tcp git pack transfer service
|
|
|
|
* git 9418/udp git pack transfer service
|
|
|
|
*
|
|
|
|
* with Linus Torvalds <torvalds@osdl.org> as the point of
|
|
|
|
* contact. September 2005.
|
|
|
|
*
|
|
|
|
* See http://www.iana.org/assignments/port-numbers
|
2005-07-14 03:46:20 +02:00
|
|
|
*/
|
|
|
|
#define DEFAULT_GIT_PORT 9418
|
|
|
|
|
2005-04-08 00:13:13 +02:00
|
|
|
/*
|
|
|
|
* Basic data structures for the directory cache
|
|
|
|
*/
|
|
|
|
|
|
|
|
#define CACHE_SIGNATURE 0x44495243 /* "DIRC" */
|
|
|
|
/*
 * Header record of the directory cache: three unsigned ints.
 * NOTE(review): hdr_signature presumably holds CACHE_SIGNATURE and
 * hdr_entries the number of entries that follow -- confirm against
 * the code that reads and writes the index.
 */
struct cache_header {
	unsigned int hdr_signature;
	unsigned int hdr_version;
	unsigned int hdr_entries;
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* The "cache_time" is just the low 32 bits of the
|
|
|
|
* time. It doesn't matter if it overflows - we only
|
|
|
|
* check it for equality in the 32 bits we save.
|
|
|
|
*/
|
|
|
|
/* A timestamp split into a seconds part and a nanoseconds part. */
struct cache_time {
	unsigned int sec;
	unsigned int nsec;
};
|
|
|
|
|
|
|
|
/*
|
|
|
|
* dev/ino/uid/gid/size are also just tracked to the low 32 bits
|
|
|
|
* Again - this is just a (very strong in practice) heuristic that
|
|
|
|
* the inode hasn't changed.
|
2005-04-15 19:44:27 +02:00
|
|
|
*
|
|
|
|
* We save the fields in big-endian order to allow using the
|
|
|
|
* index file over NFS transparently.
|
2005-04-08 00:13:13 +02:00
|
|
|
*/
|
|
|
|
struct cache_entry {
|
2005-04-15 19:44:27 +02:00
|
|
|
struct cache_time ce_ctime;
|
|
|
|
struct cache_time ce_mtime;
|
|
|
|
unsigned int ce_dev;
|
|
|
|
unsigned int ce_ino;
|
|
|
|
unsigned int ce_mode;
|
|
|
|
unsigned int ce_uid;
|
|
|
|
unsigned int ce_gid;
|
|
|
|
unsigned int ce_size;
|
2005-04-08 00:13:13 +02:00
|
|
|
unsigned char sha1[20];
|
2005-04-16 06:45:38 +02:00
|
|
|
unsigned short ce_flags;
|
2006-01-07 10:33:54 +01:00
|
|
|
char name[FLEX_ARRAY]; /* more */
|
2005-04-08 00:13:13 +02:00
|
|
|
};
|
|
|
|
|
2005-04-16 07:51:44 +02:00
|
|
|
#define CE_NAMEMASK (0x0fff)
|
|
|
|
#define CE_STAGEMASK (0x3000)
|
2005-06-06 07:07:31 +02:00
|
|
|
#define CE_UPDATE (0x4000)
|
2006-02-09 06:15:24 +01:00
|
|
|
#define CE_VALID (0x8000)
|
2005-04-16 17:33:23 +02:00
|
|
|
#define CE_STAGESHIFT 12
|
2005-04-16 07:51:44 +02:00
|
|
|
|
2005-04-16 17:33:23 +02:00
|
|
|
#define create_ce_flags(len, stage) htons((len) | ((stage) << CE_STAGESHIFT))
|
|
|
|
#define ce_namelen(ce) (CE_NAMEMASK & ntohs((ce)->ce_flags))
|
|
|
|
#define ce_size(ce) cache_entry_size(ce_namelen(ce))
|
|
|
|
#define ce_stage(ce) ((CE_STAGEMASK & ntohs((ce)->ce_flags)) >> CE_STAGESHIFT)
|
|
|
|
|
2005-04-17 07:26:31 +02:00
|
|
|
#define ce_permissions(mode) (((mode) & 0100) ? 0755 : 0644)
|
2005-05-05 14:38:25 +02:00
|
|
|
static inline unsigned int create_ce_mode(unsigned int mode)
|
|
|
|
{
|
|
|
|
if (S_ISLNK(mode))
|
|
|
|
return htonl(S_IFLNK);
|
2005-05-06 01:01:46 +02:00
|
|
|
return htonl(S_IFREG | ce_permissions(mode));
|
2005-05-05 14:38:25 +02:00
|
|
|
}
|
2007-02-17 07:43:48 +01:00
|
|
|
static inline unsigned int ce_mode_from_stat(struct cache_entry *ce, unsigned int mode)
|
|
|
|
{
|
|
|
|
extern int trust_executable_bit;
|
|
|
|
if (!trust_executable_bit && S_ISREG(mode)) {
|
|
|
|
if (ce && S_ISREG(ntohl(ce->ce_mode)))
|
|
|
|
return ce->ce_mode;
|
|
|
|
return create_ce_mode(0666);
|
|
|
|
}
|
|
|
|
return create_ce_mode(mode);
|
|
|
|
}
|
2006-03-30 08:55:43 +02:00
|
|
|
/*
 * Reduce "mode" to one of three canonical values: a regular file keeps
 * S_IFREG plus the permissions chosen by ce_permissions(), a symbolic
 * link becomes S_IFLNK, and everything else becomes S_IFDIR.
 *
 * "mode" is expanded more than once; do not pass an expression with
 * side effects.
 */
#define canon_mode(mode) \
	(S_ISREG(mode) ? (S_IFREG | ce_permissions(mode)) : \
	S_ISLNK(mode) ? S_IFLNK : S_IFDIR)
|
2005-04-17 07:26:31 +02:00
|
|
|
|
2005-04-16 17:33:23 +02:00
|
|
|
#define cache_entry_size(len) ((offsetof(struct cache_entry,name) + (len) + 8) & ~7)
|
2005-04-16 06:45:38 +02:00
|
|
|
|
2005-05-11 00:58:16 +02:00
|
|
|
extern struct cache_entry **active_cache;
|
|
|
|
extern unsigned int active_nr, active_alloc, active_cache_changed;
|
2006-04-25 06:18:58 +02:00
|
|
|
extern struct cache_tree *active_cache_tree;
|
2006-07-26 06:32:18 +02:00
|
|
|
extern int cache_errno;
|
2005-04-08 00:13:13 +02:00
|
|
|
|
2005-05-10 07:57:58 +02:00
|
|
|
#define GIT_DIR_ENVIRONMENT "GIT_DIR"
|
|
|
|
#define DEFAULT_GIT_DIR_ENVIRONMENT ".git"
|
2005-05-10 02:57:56 +02:00
|
|
|
#define DB_ENVIRONMENT "GIT_OBJECT_DIRECTORY"
|
2005-04-21 19:55:18 +02:00
|
|
|
#define INDEX_ENVIRONMENT "GIT_INDEX_FILE"
|
2005-07-30 09:58:28 +02:00
|
|
|
#define GRAFT_ENVIRONMENT "GIT_GRAFT_FILE"
|
2006-12-19 10:28:15 +01:00
|
|
|
#define TEMPLATE_DIR_ENVIRONMENT "GIT_TEMPLATE_DIR"
|
|
|
|
#define CONFIG_ENVIRONMENT "GIT_CONFIG"
|
|
|
|
#define CONFIG_LOCAL_ENVIRONMENT "GIT_CONFIG_LOCAL"
|
|
|
|
#define EXEC_PATH_ENVIRONMENT "GIT_EXEC_PATH"
|
2005-04-21 19:55:18 +02:00
|
|
|
|
2007-01-07 11:00:28 +01:00
|
|
|
extern int is_bare_repository_cfg;
|
|
|
|
extern int is_bare_repository(void);
|
2007-01-20 03:09:34 +01:00
|
|
|
extern int is_inside_git_dir(void);
|
2006-08-23 12:39:11 +02:00
|
|
|
extern const char *get_git_dir(void);
|
2005-05-10 07:57:58 +02:00
|
|
|
extern char *get_object_directory(void);
|
2005-06-06 22:31:29 +02:00
|
|
|
extern char *get_refs_directory(void);
|
2005-05-10 07:57:58 +02:00
|
|
|
extern char *get_index_file(void);
|
2005-07-30 09:58:28 +02:00
|
|
|
extern char *get_graft_file(void);
|
2005-05-10 07:57:58 +02:00
|
|
|
|
|
|
|
#define ALTERNATE_DB_ENVIRONMENT "GIT_ALTERNATE_OBJECT_DIRECTORIES"
|
2005-04-21 19:55:18 +02:00
|
|
|
|
2005-09-21 09:00:47 +02:00
|
|
|
extern const char **get_pathspec(const char *prefix, const char **pathspec);
|
2005-11-26 08:14:15 +01:00
|
|
|
extern const char *setup_git_directory_gently(int *);
|
2005-08-17 03:06:34 +02:00
|
|
|
extern const char *setup_git_directory(void);
|
2005-09-21 09:00:47 +02:00
|
|
|
extern const char *prefix_path(const char *prefix, int len, const char *path);
|
2005-11-26 08:14:15 +01:00
|
|
|
extern const char *prefix_filename(const char *prefix, int len, const char *path);
|
2006-04-26 19:15:54 +02:00
|
|
|
extern void verify_filename(const char *prefix, const char *name);
|
2006-04-27 00:09:27 +02:00
|
|
|
extern void verify_non_filename(const char *prefix, const char *name);
|
2005-08-17 03:06:34 +02:00
|
|
|
|
2005-04-08 00:13:13 +02:00
|
|
|
#define alloc_nr(x) (((x)+16)*3/2)
|
|
|
|
|
2005-04-09 18:48:20 +02:00
|
|
|
/* Initialize and use the cache information */
|
2005-04-08 00:13:13 +02:00
|
|
|
extern int read_cache(void);
|
2006-07-26 06:32:18 +02:00
|
|
|
extern int read_cache_from(const char *path);
|
2005-04-09 21:09:27 +02:00
|
|
|
extern int write_cache(int newfd, struct cache_entry **cache, int entries);
|
Status update on merge-recursive in C
This is just an update for people being interested. Alex and me were
busy with that project for a few days now. While it has progressed nicely,
there are quite a couple TODOs in merge-recursive.c, just search for "TODO".
For impatient people: yes, it passes all the tests, and yes, according
to the evil test Alex did, it is faster than the Python script.
But no, it is not yet finished. Biggest points are:
- there are still three external calls
- in the end, it should not be necessary to write the index more than once
(just before exiting)
- a lot of things can be refactored to make the code easier and shorter
BTW we cannot just plug in git-merge-tree yet, because git-merge-tree
does not handle renames at all.
This patch is meant for testing, and as such,
- it compiles the program to git-merge-recur
- it adjusts the scripts and tests to use git-merge-recur instead of
git-merge-recursive
- it provides "TEST", a script to execute the tests regarding -recursive
- it inlines the changes to read-cache.c (read_cache_from(), discard_cache()
and refresh_cache_entry())
Brought to you by Alex Riesen and Dscho
Signed-off-by: Junio C Hamano <junkio@cox.net>
2006-07-08 18:42:41 +02:00
|
|
|
extern int discard_cache(void);
|
2006-05-18 21:07:31 +02:00
|
|
|
extern int verify_path(const char *path);
|
2005-04-09 18:26:55 +02:00
|
|
|
extern int cache_name_pos(const char *name, int namelen);
|
2005-05-08 06:55:21 +02:00
|
|
|
#define ADD_CACHE_OK_TO_ADD 1 /* Ok to add */
|
|
|
|
#define ADD_CACHE_OK_TO_REPLACE 2 /* Ok to replace file/directory */
|
2005-06-25 11:25:29 +02:00
|
|
|
#define ADD_CACHE_SKIP_DFCHECK 4 /* Ok to skip DF conflict checks */
|
2005-05-08 06:55:21 +02:00
|
|
|
extern int add_cache_entry(struct cache_entry *ce, int option);
|
2006-07-26 06:32:18 +02:00
|
|
|
extern struct cache_entry *refresh_cache_entry(struct cache_entry *ce, int really);
|
2005-05-15 04:04:25 +02:00
|
|
|
extern int remove_cache_entry_at(int pos);
|
2005-09-21 09:00:47 +02:00
|
|
|
extern int remove_file_from_cache(const char *path);
|
2006-07-26 03:52:35 +02:00
|
|
|
extern int add_file_to_index(const char *path, int verbose);
|
2005-05-15 04:04:25 +02:00
|
|
|
extern int ce_same_name(struct cache_entry *a, struct cache_entry *b);
|
2006-02-09 06:15:24 +01:00
|
|
|
extern int ce_match_stat(struct cache_entry *ce, struct stat *st, int);
|
|
|
|
extern int ce_modified(struct cache_entry *ce, struct stat *st, int);
|
2005-07-15 01:55:06 +02:00
|
|
|
extern int ce_path_match(const struct cache_entry *ce, const char **pathspec);
|
2005-07-09 01:51:55 +02:00
|
|
|
extern int index_fd(unsigned char *sha1, int fd, struct stat *st, int write_object, const char *type);
|
2006-05-23 20:19:04 +02:00
|
|
|
extern int read_pipe(int fd, char** return_buf, unsigned long* return_size);
|
2005-12-10 23:25:24 +01:00
|
|
|
extern int index_pipe(unsigned char *sha1, int fd, const char *type, int write_object);
|
2005-10-07 12:42:00 +02:00
|
|
|
extern int index_path(unsigned char *sha1, const char *path, struct stat *st, int write_object);
|
2005-05-15 23:23:12 +02:00
|
|
|
extern void fill_stat_cache_info(struct cache_entry *ce, struct stat *st);
|
|
|
|
|
2006-05-19 18:56:35 +02:00
|
|
|
#define REFRESH_REALLY 0x0001 /* ignore_valid */
|
|
|
|
#define REFRESH_UNMERGED 0x0002 /* allow unmerged */
|
|
|
|
#define REFRESH_QUIET 0x0004 /* be quiet about it */
|
|
|
|
#define REFRESH_IGNORE_MISSING 0x0008 /* ignore non-existent */
|
|
|
|
extern int refresh_cache(unsigned int flags);
|
|
|
|
|
2006-06-06 21:51:49 +02:00
|
|
|
struct lock_file {
|
|
|
|
struct lock_file *next;
|
2007-01-02 20:19:05 +01:00
|
|
|
char on_list;
|
2006-06-06 21:51:49 +02:00
|
|
|
char filename[PATH_MAX];
|
2005-05-15 23:23:12 +02:00
|
|
|
};
|
2006-08-12 10:03:47 +02:00
|
|
|
extern int hold_lock_file_for_update(struct lock_file *, const char *path, int);
|
2006-06-06 21:51:49 +02:00
|
|
|
extern int commit_lock_file(struct lock_file *);
|
|
|
|
extern void rollback_lock_file(struct lock_file *);
|
2006-09-27 10:58:57 +02:00
|
|
|
extern int delete_ref(const char *, unsigned char *sha1);
|
2005-04-09 18:48:20 +02:00
|
|
|
|
2006-02-27 23:47:45 +01:00
|
|
|
/* Environment bits from configuration mechanism */
|
2006-07-11 21:48:08 +02:00
|
|
|
extern int use_legacy_headers;
|
2005-10-11 01:31:08 +02:00
|
|
|
extern int trust_executable_bit;
|
2006-02-09 06:15:24 +01:00
|
|
|
extern int assume_unchanged;
|
2006-05-02 09:40:24 +02:00
|
|
|
extern int prefer_symlink_refs;
|
2006-05-17 11:55:40 +02:00
|
|
|
extern int log_all_ref_updates;
|
2006-03-21 03:45:47 +01:00
|
|
|
extern int warn_ambiguous_refs;
|
2005-12-22 23:13:56 +01:00
|
|
|
extern int shared_repository;
|
2006-02-27 23:47:45 +01:00
|
|
|
extern const char *apply_default_whitespace;
|
2006-07-03 22:11:47 +02:00
|
|
|
extern int zlib_compression_level;
|
2006-12-23 08:34:28 +01:00
|
|
|
extern size_t packed_git_window_size;
|
2006-12-23 08:33:35 +01:00
|
|
|
extern size_t packed_git_limit;
|
Lazy man's auto-CRLF
It currently does NOT know about file attributes, so it does its
conversion purely based on content. Maybe that is more in the "git
philosophy" anyway, since content is king, but I think we should try to do
the file attributes to turn it off on demand.
Anyway, BY DEFAULT it is off regardless, because it requires a
[core]
AutoCRLF = true
in your config file to be enabled. We could make that the default for
Windows, of course, the same way we do some other things (filemode etc).
But you can actually enable it on UNIX, and it will cause:
- "git update-index" will write blobs without CRLF
- "git diff" will diff working tree files without CRLF
- "git checkout" will write files to the working tree _with_ CRLF
and things work fine.
Funnily, it actually shows an odd file in git itself:
git clone -n git test-crlf
cd test-crlf
git config core.autocrlf true
git checkout
git diff
shows a diff for "Documentation/docbook-xsl.css". Why? Because we have
actually checked in that file *with* CRLF! So when "core.autocrlf" is
true, we'll always generate a *different* hash for it in the index,
because the index hash will be for the content _without_ CRLF.
Is this complete? I dunno. It seems to work for me. It doesn't use the
filename at all right now, and that's probably a deficiency (we could
certainly make the "is_binary()" heuristics also take standard filename
heuristics into account).
I don't pass in the filename at all for the "index_fd()" case
(git-update-index), so that would need to be passed around, but this
actually works fine.
NOTE NOTE NOTE! The "is_binary()" heuristics are totally made-up by yours
truly. I will not guarantee that they work at all reasonably. Caveat
emptor. But it _is_ simple, and it _is_ safe, since it's all off by
default.
The patch is pretty simple - the biggest part is the new "convert.c" file,
but even that is really just basic stuff that anybody can write in
"Teaching C 101" as a final project for their first class in programming.
Not to say that it's bug-free, of course - but at least we're not talking
about rocket surgery here.
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Signed-off-by: Junio C Hamano <junkio@cox.net>
2007-02-13 20:07:23 +01:00
|
|
|
extern int auto_crlf;
|
2005-10-11 01:31:08 +02:00
|
|
|
|
2005-11-26 00:59:09 +01:00
|
|
|
#define GIT_REPO_VERSION 0
|
|
|
|
extern int repository_format_version;
|
|
|
|
extern int check_repository_format(void);
|
|
|
|
|
2005-04-09 18:48:20 +02:00
|
|
|
#define MTIME_CHANGED 0x0001
|
|
|
|
#define CTIME_CHANGED 0x0002
|
|
|
|
#define OWNER_CHANGED 0x0004
|
|
|
|
#define MODE_CHANGED 0x0008
|
|
|
|
#define INODE_CHANGED 0x0010
|
|
|
|
#define DATA_CHANGED 0x0020
|
2005-05-05 14:38:25 +02:00
|
|
|
#define TYPE_CHANGED 0x0040
|
2005-04-08 00:13:13 +02:00
|
|
|
|
|
|
|
/* Return a statically allocated filename matching the sha1 signature */
|
2005-08-09 17:30:22 +02:00
|
|
|
extern char *mkpath(const char *fmt, ...) __attribute__((format (printf, 1, 2)));
|
|
|
|
extern char *git_path(const char *fmt, ...) __attribute__((format (printf, 1, 2)));
|
2005-04-10 23:03:58 +02:00
|
|
|
extern char *sha1_file_name(const unsigned char *sha1);
|
2005-08-01 02:53:44 +02:00
|
|
|
extern char *sha1_pack_name(const unsigned char *sha1);
|
|
|
|
extern char *sha1_pack_index_name(const unsigned char *sha1);
|
2005-10-12 00:22:48 +02:00
|
|
|
extern const char *find_unique_abbrev(const unsigned char *sha1, int);
|
2005-09-30 23:02:47 +02:00
|
|
|
extern const unsigned char null_sha1[20];
|
2006-08-15 22:37:19 +02:00
|
|
|
static inline int is_null_sha1(const unsigned char *sha1)
|
|
|
|
{
|
|
|
|
return !memcmp(sha1, null_sha1, 20);
|
|
|
|
}
|
2006-08-17 20:54:57 +02:00
|
|
|
/*
 * Compare two 20-byte hashes with memcmp(): the result is zero when
 * they are equal, and otherwise negative or positive following
 * memcmp()'s byte-wise ordering.
 */
static inline int hashcmp(const unsigned char *sha1, const unsigned char *sha2)
{
	return memcmp(sha1, sha2, 20);
}
|
2006-08-23 08:49:00 +02:00
|
|
|
/*
 * Copy the 20-byte hash at "sha_src" to "sha_dst".  Uses memcpy(), so
 * the two buffers must not overlap.
 */
static inline void hashcpy(unsigned char *sha_dst, const unsigned char *sha_src)
{
	memcpy(sha_dst, sha_src, 20);
}
|
2006-08-23 22:57:23 +02:00
|
|
|
/* Set all 20 bytes of "hash" to zero. */
static inline void hashclr(unsigned char *hash)
{
	memset(hash, 0, 20);
}
|
2005-04-08 00:13:13 +02:00
|
|
|
|
2005-08-04 22:43:03 +02:00
|
|
|
int git_mkstemp(char *path, size_t n, const char *template);
|
|
|
|
|
2006-06-10 08:09:49 +02:00
|
|
|
/*
 * Repository sharing modes.  PERM_UMASK is explicitly 0; the other two
 * take the following values in order.
 */
enum sharedrepo {
	PERM_UMASK = 0,
	PERM_GROUP,
	PERM_EVERYBODY
};
|
|
|
|
int git_config_perm(const char *var, const char *value);
|
2005-12-22 23:13:56 +01:00
|
|
|
int adjust_shared_perm(const char *path);
|
2005-07-06 10:11:52 +02:00
|
|
|
int safe_create_leading_directories(char *path);
|
2005-11-21 01:52:52 +01:00
|
|
|
char *enter_repo(char *path, int strict);
|
2005-07-06 10:11:52 +02:00
|
|
|
|
2005-04-08 00:13:13 +02:00
|
|
|
/* Read and unpack a sha1 file into memory, write memory to a sha1 file */
|
2005-06-27 12:34:06 +02:00
|
|
|
extern int sha1_object_info(const unsigned char *, char *, unsigned long *);
|
2005-04-09 00:01:15 +02:00
|
|
|
extern void * unpack_sha1_file(void *map, unsigned long mapsize, char *type, unsigned long *size);
|
2005-04-10 23:03:58 +02:00
|
|
|
extern void * read_sha1_file(const unsigned char *sha1, char *type, unsigned long *size);
|
2006-10-14 12:45:36 +02:00
|
|
|
extern int hash_sha1_file(void *buf, unsigned long len, const char *type, unsigned char *sha1);
|
2005-05-18 14:14:09 +02:00
|
|
|
extern int write_sha1_file(void *buf, unsigned long len, const char *type, unsigned char *return_sha1);
|
2007-02-05 06:42:38 +01:00
|
|
|
extern int pretend_sha1_file(void *, unsigned long, const char *, unsigned char *);
|
2005-04-24 03:47:23 +02:00
|
|
|
|
2005-06-03 17:05:39 +02:00
|
|
|
extern int check_sha1_signature(const unsigned char *sha1, void *buf, unsigned long size, const char *type);
|
2005-04-08 00:13:13 +02:00
|
|
|
|
2005-08-03 01:46:29 +02:00
|
|
|
/*
 * Defined elsewhere.
 * NOTE(review): going by the parameter names, "buffer"/"bufsize"
 * describe a caller-supplied buffer and "*bufposn" a position within
 * it -- confirm against the definition.
 */
extern int write_sha1_from_fd(const unsigned char *sha1, int fd, char *buffer,
			      size_t bufsize, size_t *bufposn);
|
2005-07-11 00:25:38 +02:00
|
|
|
extern int write_sha1_to_fd(int fd, const unsigned char *sha1);
|
2006-09-01 09:17:47 +02:00
|
|
|
extern int move_temp_to_file(const char *tmpfile, const char *filename);
|
2005-04-24 03:47:23 +02:00
|
|
|
|
2006-09-06 11:12:09 +02:00
|
|
|
extern int has_sha1_pack(const unsigned char *sha1, const char **ignore);
|
2005-04-24 03:47:23 +02:00
|
|
|
extern int has_sha1_file(const unsigned char *sha1);
|
2006-07-18 00:04:47 +02:00
|
|
|
extern void *map_sha1_file(const unsigned char *sha1, unsigned long *);
|
|
|
|
extern int legacy_loose_object(unsigned char *);
|
2005-04-24 03:47:23 +02:00
|
|
|
|
2005-08-01 02:53:44 +02:00
|
|
|
extern int has_pack_file(const unsigned char *sha1);
|
|
|
|
extern int has_pack_index(const unsigned char *sha1);
|
|
|
|
|
2006-09-04 06:09:18 +02:00
|
|
|
/*
 * Object type codes.  Value 5 is deliberately left unassigned, and
 * OBJ_BAD takes the value after OBJ_REF_DELTA.
 */
enum object_type {
	OBJ_NONE = 0,
	OBJ_COMMIT = 1,
	OBJ_TREE = 2,
	OBJ_BLOB = 3,
	OBJ_TAG = 4,
	/* 5 for future expansion */
	OBJ_OFS_DELTA = 6,
	OBJ_REF_DELTA = 7,
	OBJ_BAD,
};
|
|
|
|
|
2006-09-21 01:04:46 +02:00
|
|
|
extern signed char hexval_table[256];

/*
 * Look up "c" in hexval_table and return the entry converted to
 * unsigned int.
 *
 * The table has exactly 256 entries, but "c" is an unsigned int: a
 * plain (signed) char holding a byte >= 0x80 is sign-extended by the
 * caller and would index far past the end of the table.  Reduce the
 * argument to its low byte first so the lookup is always in bounds;
 * for every value 0..255 the result is unchanged.
 */
static inline unsigned int hexval(unsigned int c)
{
	return hexval_table[(unsigned char)c];
}
|
|
|
|
|
2005-04-08 00:13:13 +02:00
|
|
|
/* Convert to/from hex/sha1 representation */
|
2006-01-25 10:03:18 +01:00
|
|
|
#define MINIMUM_ABBREV 4
|
|
|
|
#define DEFAULT_ABBREV 7
|
|
|
|
|
2005-05-02 01:36:56 +02:00
|
|
|
extern int get_sha1(const char *str, unsigned char *sha1);
|
2005-04-09 21:09:27 +02:00
|
|
|
extern int get_sha1_hex(const char *hex, unsigned char *sha1);
|
|
|
|
extern char *sha1_to_hex(const unsigned char *sha1); /* static buffer result! */
|
2005-09-25 18:59:37 +02:00
|
|
|
extern int read_ref(const char *filename, unsigned char *sha1);
|
2006-09-21 07:02:01 +02:00
|
|
|
extern const char *resolve_ref(const char *path, unsigned char *sha1, int, int *);
|
2007-01-19 10:15:15 +01:00
|
|
|
extern int dwim_ref(const char *str, int len, unsigned char *sha1, char **ref);
|
2007-02-09 01:28:23 +01:00
|
|
|
extern int dwim_log(const char *str, int len, unsigned char *sha1, char **ref);
|
2007-01-19 10:15:15 +01:00
|
|
|
|
2007-01-26 23:26:10 +01:00
|
|
|
extern int create_symref(const char *ref, const char *refs_heads_master, const char *logmsg);
|
2007-01-02 08:31:08 +01:00
|
|
|
extern int validate_headref(const char *ref);
|
2005-04-08 00:13:13 +02:00
|
|
|
|
2005-05-20 18:09:18 +02:00
|
|
|
extern int base_name_compare(const char *name1, int len1, int mode1, const char *name2, int len2, int mode2);
|
2005-04-09 21:59:11 +02:00
|
|
|
extern int cache_name_compare(const char *name1, int len1, const char *name2, int len2);
|
2005-04-08 00:13:13 +02:00
|
|
|
|
2005-04-29 01:42:27 +02:00
|
|
|
/*
 * Defined elsewhere.
 * NOTE(review): going by the parameter names, "required_type" names
 * the object type the caller wants, and "*size" / "sha1_ret" are
 * outputs -- confirm against the definition, including who owns the
 * returned pointer.
 */
extern void *read_object_with_reference(const unsigned char *sha1,
					const char *required_type,
					unsigned long *size,
					unsigned char *sha1_ret);
|
2005-04-21 03:06:49 +02:00
|
|
|
|
2006-08-27 00:45:26 +02:00
|
|
|
const char *show_date(unsigned long time, int timezone, int relative);
|
2006-05-01 10:44:33 +02:00
|
|
|
const char *show_rfc2822_date(unsigned long time, int timezone);
|
2005-09-20 00:53:50 +02:00
|
|
|
int parse_date(const char *date, char *buf, int bufsize);
|
2005-04-30 18:46:49 +02:00
|
|
|
void datestamp(char *buf, int bufsize);
|
git's rev-parse.c function show_datestring presumes gnu date
Ok. This is the insane patch to do this.
It really isn't very careful, and the reason I call it "approxidate()"
will become obvious when you look at the code. It is very liberal in what
it accepts, to the point where sometimes the results may not make a whole
lot of sense.
It accepts "last week" as a date string, by virtue of "last" parsing as
the number 1, and it totally ignoring superfluous fluff like "ago", so
"last week" ends up being exactly the same thing as "1 week ago". Fine so
far.
It has strange side effects: "last december" will actually parse as "Dec
1", which actually _does_ turn out right, because it will then notice that
it's not December yet, so it will decide that you must be talking about a
date last year. So it actually gets it right, but it's kind of for the
"wrong" reasons.
It also accepts the numbers 1..10 in string format ("one" .. "ten"), so
you can do "ten weeks ago" or "ten hours ago" and it will do the right
thing.
But it will do some really strange things too: the string "this will last
forever", will not recognize anything but "last", which is recognized as
"1", which since it doesn't understand anything else it will think is the
day of the month. So if you do
gitk --since="this will last forever"
the date will actually parse as the first day of the current month.
And it will parse the string "now" as "now", but only because it doesn't
understand it at all, and it makes everything relative to "now".
Similarly, it doesn't actually parse the "ago" or "from now", so "2 weeks
ago" is exactly the same as "2 weeks from now". It's the current date
minus 14 days.
But hey, it's probably better (and certainly faster) than depending on GNU
date. So now you can portably do things like
gitk --since="two weeks and three days ago"
git log --since="July 5"
git-whatchanged --since="10 hours ago"
git log --since="last october"
and it will actually do exactly what you thought it would do (I think). It
will count 17 days backwards, and it will do so even if you don't have GNU
date installed.
(I don't do "last monday" or similar yet, but I can extend it to that too
if people want).
It was kind of fun trying to write code that uses such totally relaxed
"understanding" of dates yet tries to get it right for the trivial cases.
The result should be mixed with a few strange preprocessor tricks, and be
submitted for the IOCCC ;)
Feel free to try it out, and see how many strange dates it gets right. Or
wrong.
And if you find some interesting (and valid - not "interesting" as in
"strange", but "interesting" as in "I'd be interested in actually doing
this) thing it gets wrong - usually by not understanding it and silently
just doing some strange things - please holler.
Now, as usual this certainly hasn't been getting a lot of testing. But my
code always works, no?
Linus
Signed-off-by: Junio C Hamano <junkio@cox.net>
2005-11-15 04:29:06 +01:00
|
|
|
unsigned long approxidate(const char *);
|
2005-04-30 18:46:49 +02:00
|
|
|
|
2006-02-19 05:31:05 +01:00
|
|
|
extern const char *git_author_info(int);
|
|
|
|
extern const char *git_committer_info(int);
|
2007-02-05 02:50:14 +01:00
|
|
|
extern const char *fmt_ident(const char *name, const char *email, const char *date_str, int);
|
2005-07-12 20:49:27 +02:00
|
|
|
|
2005-06-06 06:59:54 +02:00
|
|
|
/*
 * Options passed to checkout_entry(): a base directory string with its
 * length, plus four single-bit flags.
 */
struct checkout {
	const char *base_dir;
	int base_dir_len;
	unsigned force:1,
		 quiet:1,
		 not_new:1,
		 refresh_cache:1;
};
|
|
|
|
|
2006-03-05 09:24:15 +01:00
|
|
|
extern int checkout_entry(struct cache_entry *ce, struct checkout *state, char *topath);
|
2005-06-06 06:59:54 +02:00
|
|
|
|
2005-06-28 23:56:57 +02:00
|
|
|
extern struct alternate_object_database {
|
2005-08-15 02:25:57 +02:00
|
|
|
struct alternate_object_database *next;
|
2005-06-28 23:56:57 +02:00
|
|
|
char *name;
|
2006-01-07 10:33:54 +01:00
|
|
|
char base[FLEX_ARRAY]; /* more */
|
2005-08-15 02:25:57 +02:00
|
|
|
} *alt_odb_list;
|
2005-06-28 23:56:57 +02:00
|
|
|
extern void prepare_alt_odb(void);
|
|
|
|
|
2006-12-23 08:33:44 +01:00
|
|
|
/*
 * Node of a singly linked list of pack windows (see the "windows"
 * member of struct packed_git).
 * NOTE(review): "base"/"offset"/"len" presumably describe a mapped
 * region of the pack file, and "last_used"/"inuse_cnt" its usage
 * bookkeeping -- confirm against use_pack()/unuse_pack().
 */
struct pack_window {
	struct pack_window *next;
	unsigned char *base;
	off_t offset;
	size_t len;
	unsigned int last_used;
	unsigned int inuse_cnt;
};
|
|
|
|
|
2005-06-28 23:56:57 +02:00
|
|
|
extern struct packed_git {
|
|
|
|
struct packed_git *next;
|
2006-12-23 08:33:44 +01:00
|
|
|
struct pack_window *windows;
|
2007-01-18 08:17:28 +01:00
|
|
|
uint32_t *index_base;
|
2006-12-23 08:33:47 +01:00
|
|
|
off_t index_size;
|
|
|
|
off_t pack_size;
|
2006-12-23 08:34:01 +01:00
|
|
|
int pack_fd;
|
2005-10-14 00:38:28 +02:00
|
|
|
int pack_local;
|
2005-08-01 02:53:44 +02:00
|
|
|
unsigned char sha1[20];
|
2006-01-07 10:33:54 +01:00
|
|
|
/* something like ".git/objects/pack/xxxxx.pack" */
|
|
|
|
char pack_name[FLEX_ARRAY]; /* more */
|
2005-06-28 23:56:57 +02:00
|
|
|
} *packed_git;
|
2005-07-01 02:15:39 +02:00
|
|
|
|
|
|
|
/*
 * An object id ("sha1") paired with an offset and the pack "p" it
 * refers to.
 */
struct pack_entry {
	unsigned int offset;
	unsigned char sha1[20];
	struct packed_git *p;
};
|
|
|
|
|
2005-07-16 22:55:50 +02:00
|
|
|
struct ref {
|
|
|
|
struct ref *next;
|
|
|
|
unsigned char old_sha1[20];
|
|
|
|
unsigned char new_sha1[20];
|
2005-08-24 09:40:14 +02:00
|
|
|
unsigned char force;
|
2005-08-04 01:35:29 +02:00
|
|
|
struct ref *peer_ref; /* when renaming */
|
2006-01-07 10:33:54 +01:00
|
|
|
char name[FLEX_ARRAY]; /* more */
|
2005-07-16 22:55:50 +02:00
|
|
|
};
|
|
|
|
|
Improve git-peek-remote
This makes git-peek-remote able to basically do everything that
git-ls-remote does (but obviously just for the native protocol, so no
http[s]: or rsync: support).
The default behaviour is the same, but you can now give a mixture of
"--refs", "--tags" and "--heads" flags, where "--refs" forces
git-peek-remote to only show real refs (ie none of the fakey tag lookups,
but also not the special pseudo-refs like HEAD and MERGE_HEAD).
The "--tags" and "--heads" flags respectively limit the output to just
regular tags and heads, of course.
You can still also ask to limit them by name too.
You can combine the flags, so
git peek-remote --refs --tags .
will show all local _true_ tags, without the generated tag lookups
(compare the output without the "--refs" flag).
And "--tags --heads" will show both tags and heads, but will avoid (for
example) any special refs outside of the standard locations.
I'm also planning on adding a "--ignore-local" flag that allows us to ask
it to ignore any refs that we already have in the local tree, but that's
an independent thing.
All this is obviously gearing up to making "git fetch" cheaper.
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Signed-off-by: Junio C Hamano <junkio@cox.net>
2006-07-04 21:29:10 +02:00
|
|
|
#define REF_NORMAL (1u << 0)
|
|
|
|
#define REF_HEADS (1u << 1)
|
|
|
|
#define REF_TAGS (1u << 2)
|
|
|
|
|
2006-09-12 11:00:13 +02:00
|
|
|
extern pid_t git_connect(int fd[2], char *url, const char *prog);
|
2005-07-04 20:57:58 +02:00
|
|
|
extern int finish_connect(pid_t pid);
|
2005-07-04 22:24:30 +02:00
|
|
|
extern int path_match(const char *path, int nr, char **match);
|
2005-08-04 01:35:29 +02:00
|
|
|
/*
 * Defined elsewhere.
 * NOTE(review): going by the parameter names, "refspec" is an array of
 * "nr_refspec" strings and "dst_tail" tracks the tail of the "dst"
 * list -- confirm against the definition.
 */
extern int match_refs(struct ref *src, struct ref *dst, struct ref ***dst_tail,
		      int nr_refspec, char **refspec, int all);
|
2005-07-06 00:44:09 +02:00
|
|
|
extern int get_ack(int fd, unsigned char *result_sha1);
|
Improve git-peek-remote
This makes git-peek-remote able to basically do everything that
git-ls-remote does (but obviously just for the native protocol, so no
http[s]: or rsync: support).
The default behaviour is the same, but you can now give a mixture of
"--refs", "--tags" and "--heads" flags, where "--refs" forces
git-peek-remote to only show real refs (ie none of the fakey tag lookups,
but also not the special pseudo-refs like HEAD and MERGE_HEAD).
The "--tags" and "--heads" flags respectively limit the output to just
regular tags and heads, of course.
You can still also ask to limit them by name too.
You can combine the flags, so
git peek-remote --refs --tags .
will show all local _true_ tags, without the generated tag lookups
(compare the output without the "--refs" flag).
And "--tags --heads" will show both tags and heads, but will avoid (for
example) any special refs outside of the standard locations.
I'm also planning on adding a "--ignore-local" flag that allows us to ask
it to ignore any refs that we already have in the local tree, but that's
an independent thing.
All this is obviously gearing up to making "git fetch" cheaper.
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Signed-off-by: Junio C Hamano <junkio@cox.net>
2006-07-04 21:29:10 +02:00
|
|
|
extern struct ref **get_remote_heads(int in, struct ref **list, int nr_match, char **match, unsigned int flags);
|
2005-10-28 04:48:54 +02:00
|
|
|
extern int server_supports(const char *feature);
|
2005-07-04 20:57:58 +02:00
|
|
|
|
2005-08-01 02:53:44 +02:00
|
|
|
extern struct packed_git *parse_pack_index(unsigned char *sha1);
|
2005-09-02 14:17:10 +02:00
|
|
|
/*
 * Defined elsewhere.
 * NOTE(review): presumably like parse_pack_index() but with the index
 * file location given explicitly in "idx_path" -- confirm against the
 * definition.
 */
extern struct packed_git *parse_pack_index_file(const unsigned char *sha1,
						char *idx_path);
|
2005-08-01 02:53:44 +02:00
|
|
|
|
2005-06-28 23:56:57 +02:00
|
|
|
/*
 * Takes no arguments and returns nothing.
 * NOTE(review): presumably discovers the available pack files and records
 * them for later lookups -- confirm against the definition.
 */
extern void prepare_packed_git(void);
|
2006-11-01 23:06:21 +01:00
|
|
|
/*
 * Takes no arguments and returns nothing.
 * NOTE(review): presumably forces prepare_packed_git() to rescan so that
 * newly created packs are noticed -- confirm against the definition.
 */
extern void reprepare_packed_git(void);
|
2005-08-01 02:53:44 +02:00
|
|
|
/*
 * NOTE(review): presumably adds `pack` to the list of known packs -- confirm
 * against the definition.
 */
extern void install_packed_git(struct packed_git *pack);
|
|
|
|
|
|
|
|
/*
 * NOTE(review): presumably walks the pack list starting at `packs` and
 * returns the pack that contains the object `sha1`, or NULL when none does
 * -- confirm against the definition.
 */
extern struct packed_git *find_sha1_pack(const unsigned char *sha1,
|
|
|
|
struct packed_git *packs);
|
|
|
|
|
2007-01-17 07:28:02 +01:00
|
|
|
/*
 * Takes no arguments and returns nothing.
 * NOTE(review): presumably prints pack access statistics -- confirm the
 * output stream and contents against the definition.
 */
extern void pack_report(void);
|
2006-12-23 08:34:08 +01:00
|
|
|
/*
 * use_pack() returns a byte pointer and takes a pack, a pointer to a
 * pack_window pointer, an unsigned long and an unsigned int out-pointer.
 * NOTE(review): parameters are unnamed; presumably the unsigned long is an
 * offset into the pack, the window pointer is a cursor updated by the call,
 * and the last argument receives the number of bytes available at the
 * returned address -- confirm against the definition.
 */
extern unsigned char* use_pack(struct packed_git *, struct pack_window **, unsigned long, unsigned int *);
|
|
|
|
/*
 * NOTE(review): presumably releases the window cursor obtained through
 * use_pack() -- confirm against the definition.
 */
extern void unuse_pack(struct pack_window **);
|
2005-10-14 00:38:28 +02:00
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably a path, its length and a
 * "local" flag, returning the newly described pack or NULL -- confirm against
 * the definition.
 */
extern struct packed_git *add_packed_git(char *, int, int);
|
2005-06-28 23:56:57 +02:00
|
|
|
/*
 * NOTE(review): presumably returns the number of objects stored in pack `p`
 * -- confirm against the definition.
 */
extern int num_packed_objects(const struct packed_git *p);
|
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably copies the object name of
 * the n-th entry of the pack into the output buffer and reports failure
 * through the return value -- confirm against the definition.
 */
extern int nth_packed_object_sha1(const struct packed_git *, int, unsigned char*);
|
2006-09-21 06:05:37 +02:00
|
|
|
/*
 * NOTE(review): presumably looks up the given object name in a single pack
 * and returns its offset, with 0 meaning "not found" -- confirm against the
 * definition.
 */
extern unsigned long find_pack_entry_one(const unsigned char *, struct packed_git *);
|
2006-12-23 08:33:25 +01:00
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably (pack, offset, type-name
 * buffer, size out-pointer), returning a buffer holding the unpacked object
 * -- confirm ownership of the returned buffer against the definition.
 */
extern void *unpack_entry(struct packed_git *, unsigned long, char *, unsigned long *);
|
2006-09-04 06:09:18 +02:00
|
|
|
/*
 * Reads from `buf` (at most `len` bytes, judging by the parameter names) and
 * reports through `type` and `sizep`.
 * NOTE(review): presumably returns the number of header bytes consumed, with
 * 0 signalling a malformed header rather than dying -- confirm against the
 * definition.
 */
extern unsigned long unpack_object_header_gently(const unsigned char *buf, unsigned long len, enum object_type *type, unsigned long *sizep);
|
2006-09-21 06:05:37 +02:00
|
|
|
/*
 * NOTE(review): all seven parameters are unnamed. Presumably takes a pack and
 * an offset and fills the remaining out-parameters with details of the entry
 * (type name, sizes, delta chain length, base object name) -- confirm the
 * exact order against the definition.
 */
extern void packed_object_info_detail(struct packed_git *, unsigned long, char *, unsigned long *, unsigned long *, unsigned int *, unsigned char *);
|
2005-06-28 23:56:57 +02:00
|
|
|
|
[PATCH] Add update-server-info.
The git-update-server-info command prepares informational files
to help clients discover the contents of a repository, and pull
from it via dumb transport protocols. Currently, the
following files are produced.
- The $repo/info/refs file lists the name of heads and tags
available in the $repo/refs/ directory, along with their
SHA1. This can be used by git-ls-remote command running on
the client side.
- The $repo/info/rev-cache file describes the commit ancestry
reachable from references in the $repo/refs/ directory. This
file is in an append-only binary format to make the server
side friendly to rsync mirroring scheme, and can be read by
git-show-rev-cache command.
- The $repo/objects/info/pack file lists the name of the packs
available, the interdependencies among them, and the head
commits and tags contained in them. Along with the other two
files, this is designed to help clients to make smart pull
decisions.
The git-receive-pack command is changed to invoke it at the end,
so just after a push to a public repository finishes via "git
push", the server info is automatically updated.
In addition, building of the rev-cache file can be done by a
standalone git-build-rev-cache command separately.
Signed-off-by: Junio C Hamano <junkio@cox.net>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
2005-07-24 02:54:41 +02:00
|
|
|
/*
 * Dumb servers support.
 *
 * Introduced together with the git-update-server-info command, which prepares
 * informational files that help clients discover the contents of a repository
 * and pull from it over dumb transports.
 */
|
|
|
|
/*
 * NOTE(review): the meaning of the int argument and of the return value is
 * not visible here -- confirm against the definition.
 */
extern int update_server_info(int);
|
|
|
|
|
2005-10-11 01:31:08 +02:00
|
|
|
/*
 * Callback type: takes two strings and returns int. git_config() and
 * git_config_from_file() accept a callback of this type, and
 * check_repository_format_version() has this shape with its arguments named
 * `var` and `value`.
 * NOTE(review): the meaning of the return value is not visible here.
 */
typedef int (*config_fn_t)(const char *, const char *);
|
|
|
|
/*
 * Has the config_fn_t signature.
 * NOTE(review): presumably the fallback callback that handles the commonly
 * shared configuration variables -- confirm against the definition.
 */
extern int git_default_config(const char *, const char *);
|
2005-11-26 01:03:56 +01:00
|
|
|
/*
 * NOTE(review): presumably parses the file named by the second argument and
 * invokes `fn` for each variable found -- confirm against the definition.
 */
extern int git_config_from_file(config_fn_t fn, const char *);
|
2005-10-11 01:31:08 +02:00
|
|
|
/*
 * NOTE(review): presumably reads the active configuration and invokes `fn`
 * for each variable; which files are consulted is not visible here -- confirm
 * against the definition.
 */
extern int git_config(config_fn_t fn);
|
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably (variable name, value
 * string), returning the value parsed as an integer -- confirm against the
 * definition.
 */
extern int git_config_int(const char *, const char *);
|
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably (variable name, value
 * string), returning the value interpreted as a boolean -- confirm against
 * the definition.
 */
extern int git_config_bool(const char *, const char *);
|
2005-11-17 22:32:36 +01:00
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably (key, value), writing the
 * setting to the configuration file -- confirm against the definition.
 */
extern int git_config_set(const char *, const char *);
|
2005-11-20 06:52:22 +01:00
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably (key, value, pattern
 * selecting which existing values to touch, "replace all" flag) -- confirm
 * against the definition.
 */
extern int git_config_set_multivar(const char *, const char *, const char *, int);
|
2006-12-16 15:14:14 +01:00
|
|
|
/*
 * NOTE(review): parameters are unnamed; presumably (old section name, new
 * section name) -- confirm against the definition.
 */
extern int git_config_rename_section(const char *, const char *);
|
2005-11-26 00:59:09 +01:00
|
|
|
/*
 * Has the config_fn_t signature, so it can be passed to git_config().
 * NOTE(review): presumably records or validates the repository format
 * version when `var` names that setting -- confirm against the definition.
 */
extern int check_repository_format_version(const char *var, const char *value);
|
2005-10-11 01:31:08 +02:00
|
|
|
|
2005-10-12 03:47:34 +02:00
|
|
|
/* Size, in bytes, of the git_default_email and git_default_name buffers. */
#define MAX_GITNAME (1000)
|
|
|
|
/* NOTE(review): presumably the default e-mail address for identities. */
extern char git_default_email[MAX_GITNAME];
|
|
|
|
/* NOTE(review): presumably the default personal name for identities. */
extern char git_default_name[MAX_GITNAME];
|
|
|
|
|
2006-12-28 01:41:33 +01:00
|
|
|
/*
 * NOTE(review): presumably the name of the character encoding used for
 * commit objects; whether NULL is a valid value is not visible here.
 */
extern char *git_commit_encoding;
|
|
|
|
/*
 * NOTE(review): presumably the name of the character encoding used for log
 * output; whether NULL is a valid value is not visible here.
 */
extern char *git_log_output_encoding;
|
2005-11-28 01:09:40 +01:00
|
|
|
|
2005-10-22 10:28:13 +02:00
|
|
|
/*
 * NOTE(review): presumably copies everything readable from `ifd` to `ofd`;
 * the return-value convention and whether either descriptor is closed are
 * not visible here -- confirm against the definition.
 */
extern int copy_fd(int ifd, int ofd);
|
2007-01-08 16:58:08 +01:00
|
|
|
/*
 * NOTE(review): presumably keeps reading from `fd` until `count` bytes are in
 * `buf`, or EOF/error occurs. Note the int return type against the size_t
 * `count` -- confirm the return convention against the definition.
 */
extern int read_in_full(int fd, void *buf, size_t count);
|
2007-01-08 16:57:52 +01:00
|
|
|
/*
 * NOTE(review): presumably keeps writing until all `count` bytes of `buf`
 * reach `fd` or an error occurs. Note the int return type against the size_t
 * `count` -- confirm the return convention against the definition.
 */
extern int write_in_full(int fd, const void *buf, size_t count);
|
2006-08-21 20:43:43 +02:00
|
|
|
/*
 * Returns nothing, so callers get no failure indication.
 * NOTE(review): presumably writes all `count` bytes of `buf` to `fd` and
 * terminates the program on failure -- confirm against the definition.
 */
extern void write_or_die(int fd, const void *buf, size_t count);
|
2006-09-02 18:23:48 +02:00
|
|
|
/*
 * NOTE(review): presumably writes all `count` bytes of `buf` to `fd` and, on
 * failure, reports an error mentioning `msg` instead of dying; the return
 * convention is not visible here -- confirm against the definition.
 */
extern int write_or_whine(int fd, const void *buf, size_t count, const char *msg);
|
2007-01-08 16:57:52 +01:00
|
|
|
/*
 * Same parameters as write_or_whine().
 * NOTE(review): presumably differs in how a closed pipe on `fd` is treated
 * -- confirm against the definition.
 */
extern int write_or_whine_pipe(int fd, const void *buf, size_t count, const char *msg);
|
2005-12-15 07:17:38 +01:00
|
|
|
|
2006-02-28 20:26:21 +01:00
|
|
|
/* pager.c */
|
|
|
|
/*
 * Takes no arguments and returns nothing.
 * NOTE(review): presumably arranges for subsequent output to go through a
 * pager -- confirm against the definition.
 */
extern void setup_pager(void);
|
2006-06-07 01:58:40 +02:00
|
|
|
/* NOTE(review): presumably non-zero once output is going through a pager. */
extern int pager_in_use;
|
2006-07-30 00:27:43 +02:00
|
|
|
/*
 * NOTE(review): presumably controls whether colored output is allowed while
 * a pager is in use -- confirm against the code that reads it.
 */
extern int pager_use_color;
|
2006-02-28 20:26:21 +01:00
|
|
|
|
binary patch.
This adds "binary patch" to the diff output and teaches apply
what to do with them.
On the diff generation side, traditionally, we said "Binary
files differ\n" without giving anything other than the preimage
and postimage object name on the index line. This was good
enough for applying a patch generated from your own repository
(very useful while rebasing), because the postimage would be
available in such a case. However, this was not useful when the
recipient of such a patch via e-mail were to apply it, even if
the preimage was available.
This patch allows the diff to generate "binary" patch when
operating under --full-index option. The binary patch follows
the usual extended git diff headers, and looks like this:
"GIT binary patch\n"
<length byte><data>"\n"
...
"\n"
Each line is prefixed with a "length-byte", whose value is upper
or lowercase alphabet that encodes number of bytes that the data
on the line decodes to (1..52 -- 'A' means 1, 'B' means 2, ...,
'Z' means 26, 'a' means 27, ...). <data> is 1 or more groups of
5-byte sequences, each of which encodes up to 4 bytes in base85
encoding. Because 52 / 4 * 5 = 65 and we have the length byte,
an output line is capped to 66 characters. The payload is the
same diff-delta as we use in the packfiles.
On the consumption side, git-apply now can decode and apply the
binary patch when --allow-binary-replacement is given, the diff
was generated with --full-index, and the receiving repository
has the preimage blob, which is the same condition as it always
required when accepting a "Binary files differ\n" patch.
Signed-off-by: Junio C Hamano <junkio@cox.net>
2006-05-05 01:51:44 +02:00
|
|
|
/*
 * base85: introduced with "GIT binary patch" support, where each data line is
 * made of 5-character groups that each encode up to 4 bytes.
 */
|
|
|
|
/*
 * NOTE(review): presumably decodes the base85 text in `line` into `dst`;
 * whether `linelen` counts encoded characters or decoded bytes, and the
 * return convention, are not visible here -- confirm against the definition.
 */
int decode_85(char *dst, char *line, int linelen);
|
2006-05-05 11:41:53 +02:00
|
|
|
/*
 * NOTE(review): presumably base85-encodes `bytes` bytes of `data` into `buf`;
 * the required size of `buf` and whether the output is NUL-terminated are not
 * visible here -- confirm against the definition.
 */
void encode_85(char *buf, unsigned char *data, int bytes);
|
binary patch.
This adds "binary patch" to the diff output and teaches apply
what to do with them.
On the diff generation side, traditionally, we said "Binary
files differ\n" without giving anything other than the preimage
and postimage object name on the index line. This was good
enough for applying a patch generated from your own repository
(very useful while rebasing), because the postimage would be
available in such a case. However, this was not useful when the
recipient of such a patch via e-mail were to apply it, even if
the preimage was available.
This patch allows the diff to generate "binary" patch when
operating under --full-index option. The binary patch follows
the usual extended git diff headers, and looks like this:
"GIT binary patch\n"
<length byte><data>"\n"
...
"\n"
Each line is prefixed with a "length-byte", whose value is upper
or lowercase alphabet that encodes number of bytes that the data
on the line decodes to (1..52 -- 'A' means 1, 'B' means 2, ...,
'Z' means 26, 'a' means 27, ...). <data> is 1 or more groups of
5-byte sequences, each of which encodes up to 4 bytes in base85
encoding. Because 52 / 4 * 5 = 65 and we have the length byte,
an output line is capped to 66 characters. The payload is the
same diff-delta as we use in the packfiles.
On the consumption side, git-apply now can decode and apply the
binary patch when --allow-binary-replacement is given, the diff
was generated with --full-index, and the receiving repository
has the preimage blob, which is the same condition as it always
required when accepting a "Binary files differ\n" patch.
Signed-off-by: Junio C Hamano <junkio@cox.net>
2006-05-05 01:51:44 +02:00
|
|
|
|
Add specialized object allocator
This creates a simple specialized object allocator for basic
objects.
This avoids wasting space with malloc overhead (metadata and
extra alignment), since the specialized allocator knows the
alignment, and that objects, once allocated, are never freed.
It also allows us to track some basic statistics about object
allocations. For example, for the mozilla import, it shows
object usage as follows:
blobs: 627629 (14710 kB)
trees: 1119035 (34969 kB)
commits: 196423 (8440 kB)
tags: 1336 (46 kB)
and the simpler allocator shaves about 2.5% off the memory
footprint of a "git-rev-list --all --objects", and is a bit
faster too.
[ Side note: this concludes the series of "save memory in object storage".
The thing is, there simply isn't much more to be saved on the objects.
Doing "git-rev-list --all --objects" on the mozilla archive has a final
total RSS of 131498 pages for me: that's about 513MB. Of that, the
object overhead is now just 56MB, the rest is going somewhere else (put
another way: the fact that this patch shaves off 2.5% of the total
memory overhead, considering that objects are now not much more than 10%
of the total shows how big the wasted space really was: this makes
object allocations much more memory- and time-efficient).
I haven't looked at where the rest is, but I suspect the bulk of it is
just the pack-file loading. It may be that we should pack the tree
objects separately from the blob objects: for git-rev-list --objects, we
don't actually ever need to even look at the blobs, but since trees and
blobs are interspersed in the pack-file, we end up not being dense in
the tree accesses, so we end up looking at more pages than we strictly
need to.
So with a 535MB pack-file, it's entirely possible - even likely - that
most of the remaining RSS is just the mmap of the pack-file itself. We
don't need to map in _all_ of it, but we do end up mapping a fair
amount. ]
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Signed-off-by: Junio C Hamano <junkio@cox.net>
2006-06-19 19:44:15 +02:00
|
|
|
/* alloc.c: specialized allocator for blob, tree, commit and tag objects */
|
|
|
|
/*
 * Forward declarations only: the allocator prototypes in this header return
 * pointers to these types, so the full definitions are not needed here.
 */
struct blob;
|
|
|
|
struct tree;
|
|
|
|
struct commit;
|
|
|
|
struct tag;
|
|
|
|
/*
 * One allocation entry point per object type, each taking no arguments and
 * returning a pointer to the node type. These were introduced as a
 * specialized allocator that relies on objects never being freed once
 * allocated.
 * NOTE(review): whether the returned node is zero-initialized is not visible
 * here -- confirm against the definition.
 */
extern struct blob *alloc_blob_node(void);
|
|
|
|
extern struct tree *alloc_tree_node(void);
|
|
|
|
extern struct commit *alloc_commit_node(void);
|
|
|
|
extern struct tag *alloc_tag_node(void);
|
|
|
|
/*
 * NOTE(review): presumably prints the per-type allocation statistics the
 * allocator tracks -- confirm the output format against the definition.
 */
extern void alloc_report(void);
|
|
|
|
|
2006-09-02 18:23:48 +02:00
|
|
|
/* trace.c */
|
|
|
|
/*
 * Takes a printf-style format with a va_list and an output `str` pointer.
 * NOTE(review): presumably allocates the formatted string into `*str` and
 * returns its length or a negative value on failure -- confirm against the
 * definition, including who frees `*str`.
 */
extern int nfvasprintf(char **str, const char *fmt, va_list va);
|
|
|
|
/*
 * Variadic, printf-style.
 * NOTE(review): presumably emits a trace message only when tracing is
 * enabled; how it is enabled is not visible here.
 */
extern void trace_printf(const char *format, ...);
|
|
|
|
/*
 * Variadic, printf-style, with an argument vector.
 * NOTE(review): presumably emits the formatted message followed by `argv`;
 * the meaning of `count` (e.g. whether a negative value means "until NULL")
 * is not visible here -- confirm against the definition.
 */
extern void trace_argv_printf(const char **argv, int count, const char *format, ...);
|
|
|
|
|
Lazy man's auto-CRLF
It currently does NOT know about file attributes, so it does its
conversion purely based on content. Maybe that is more in the "git
philosophy" anyway, since content is king, but I think we should try to do
the file attributes to turn it off on demand.
Anyway, BY DEFAULT it is off regardless, because it requires a
[core]
AutoCRLF = true
in your config file to be enabled. We could make that the default for
Windows, of course, the same way we do some other things (filemode etc).
But you can actually enable it on UNIX, and it will cause:
- "git update-index" will write blobs without CRLF
- "git diff" will diff working tree files without CRLF
- "git checkout" will write files to the working tree _with_ CRLF
and things work fine.
Funnily, it actually shows an odd file in git itself:
git clone -n git test-crlf
cd test-crlf
git config core.autocrlf true
git checkout
git diff
shows a diff for "Documentation/docbook-xsl.css". Why? Because we have
actually checked in that file *with* CRLF! So when "core.autocrlf" is
true, we'll always generate a *different* hash for it in the index,
because the index hash will be for the content _without_ CRLF.
Is this complete? I dunno. It seems to work for me. It doesn't use the
filename at all right now, and that's probably a deficiency (we could
certainly make the "is_binary()" heuristics also take standard filename
heuristics into account).
I don't pass in the filename at all for the "index_fd()" case
(git-update-index), so that would need to be passed around, but this
actually works fine.
NOTE NOTE NOTE! The "is_binary()" heuristics are totally made-up by yours
truly. I will not guarantee that they work at all reasonably. Caveat
emptor. But it _is_ simple, and it _is_ safe, since it's all off by
default.
The patch is pretty simple - the biggest part is the new "convert.c" file,
but even that is really just basic stuff that anybody can write in
"Teaching C 101" as a final project for their first class in programming.
Not to say that it's bug-free, of course - but at least we're not talking
about rocket surgery here.
Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org>
Signed-off-by: Junio C Hamano <junkio@cox.net>
2007-02-13 20:07:23 +01:00
|
|
|
/*
 * convert.c: automatic CRLF conversion. It is off unless core.autocrlf is
 * enabled, and the decision is based on content rather than on the filename.
 */
|
|
|
|
/*
 * NOTE(review): presumably the working-tree-to-repository direction (CRLF
 * removed), replacing `*bufp` / `*sizep` when a conversion happens and
 * signalling that through the return value -- confirm against the definition,
 * including ownership of the old and new buffers.
 */
extern int convert_to_git(const char *path, char **bufp, unsigned long *sizep);
|
|
|
|
/*
 * NOTE(review): presumably the repository-to-working-tree direction (CRLF
 * added), with the same buffer and return conventions as convert_to_git() --
 * confirm against the definition.
 */
extern int convert_to_working_tree(const char *path, char **bufp, unsigned long *sizep);
|
|
|
|
|
2005-04-08 00:13:13 +02:00
|
|
|
#endif /* CACHE_H */
|