blob: 90e7900e6d7aff2fadf9ba04f8d982733493411c [file] [log] [blame]
Linus Torvaldsd98b46f2005-04-20 01:10:46 -07001#include "cache.h"
Peter Eriksen8e440252006-04-02 14:44:09 +02002#include "blob.h"
3#include "commit.h"
4#include "tree.h"
Linus Torvaldsd98b46f2005-04-20 01:10:46 -07005
/*
 * One object tracked during conversion: pairs the SHA-1 an object was
 * looked up by with the SHA-1 of its rewritten form.
 */
struct entry {
	unsigned char old_sha1[20];	/* name the object was looked up by */
	unsigned char new_sha1[20];	/* name of the rewritten object */
	int converted;			/* set to 1 once the object has been converted */
};
11
/* Capacity of the conversion table below. */
#define MAXOBJECTS (1000000)

/*
 * Conversion table.  lookup_entry() binary-searches it by old_sha1 and
 * insert_new() inserts at the position the search ended on, so the
 * first nr_convert slots stay ordered by old_sha1.
 */
static struct entry *convert[MAXOBJECTS];
static int nr_convert;

/* Defined further down; needed early because conversion is recursive. */
static struct entry * convert_entry(unsigned char *sha1);
18
19static struct entry *insert_new(unsigned char *sha1, int pos)
20{
Peter Eriksen90321c12006-04-03 19:30:46 +010021 struct entry *new = xcalloc(1, sizeof(struct entry));
Shawn Pearcee7024962006-08-23 02:49:00 -040022 hashcpy(new->old_sha1, sha1);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -070023 memmove(convert + pos + 1, convert + pos, (nr_convert - pos) * sizeof(struct entry *));
24 convert[pos] = new;
25 nr_convert++;
26 if (nr_convert == MAXOBJECTS)
27 die("you're kidding me - hit maximum object limit");
28 return new;
29}
30
31static struct entry *lookup_entry(unsigned char *sha1)
32{
33 int low = 0, high = nr_convert;
34
35 while (low < high) {
36 int next = (low + high) / 2;
37 struct entry *n = convert[next];
David Rientjesa89fccd2006-08-17 11:54:57 -070038 int cmp = hashcmp(sha1, n->old_sha1);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -070039 if (!cmp)
40 return n;
41 if (cmp < 0) {
42 high = next;
43 continue;
44 }
45 low = next+1;
46 }
47 return insert_new(sha1, low);
48}
49
Linus Torvaldsd98b46f2005-04-20 01:10:46 -070050static void convert_binary_sha1(void *buffer)
51{
52 struct entry *entry = convert_entry(buffer);
Shawn Pearcee7024962006-08-23 02:49:00 -040053 hashcpy(buffer, entry->new_sha1);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -070054}
55
56static void convert_ascii_sha1(void *buffer)
57{
58 unsigned char sha1[20];
59 struct entry *entry;
60
61 if (get_sha1_hex(buffer, sha1))
Junio C Hamano79db12e2005-08-09 21:25:46 -070062 die("expected sha1, got '%s'", (char*) buffer);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -070063 entry = convert_entry(sha1);
64 memcpy(buffer, sha1_to_hex(entry->new_sha1), 40);
65}
66
/*
 * Normalize a tree-entry mode.  Only the file-type bits are kept; a
 * regular file additionally gets permissions 0755 if its owner-execute
 * bit (0100) was set and 0644 otherwise.  Every other file type ends up
 * with no permission bits at all.
 */
static unsigned int convert_mode(unsigned int mode)
{
	unsigned int newmode = mode & S_IFMT;

	if (S_ISREG(mode))
		newmode |= (mode & 0100) ? 0755 : 0644;
	return newmode;
}
76
Linus Torvaldsbfac5d92005-04-23 16:37:31 -070077static int write_subdirectory(void *buffer, unsigned long size, const char *base, int baselen, unsigned char *result_sha1)
78{
Christopher Li812666c2005-04-26 12:00:58 -070079 char *new = xmalloc(size);
Linus Torvaldsa44c9a52005-04-25 10:19:53 -070080 unsigned long newlen = 0;
Linus Torvaldsbfac5d92005-04-23 16:37:31 -070081 unsigned long used;
Linus Torvaldsbfac5d92005-04-23 16:37:31 -070082
83 used = 0;
84 while (size) {
85 int len = 21 + strlen(buffer);
86 char *path = strchr(buffer, ' ');
87 unsigned char *sha1;
88 unsigned int mode;
89 char *slash, *origpath;
90
Andy Whitcroft6e6db392007-04-19 03:08:15 +010091 if (!path || strtoul_ui(buffer, 8, &mode))
Linus Torvaldsbfac5d92005-04-23 16:37:31 -070092 die("bad tree conversion");
Linus Torvalds4e813042005-07-27 15:29:38 -070093 mode = convert_mode(mode);
Linus Torvaldsbfac5d92005-04-23 16:37:31 -070094 path++;
95 if (memcmp(path, base, baselen))
96 break;
97 origpath = path;
98 path += baselen;
99 slash = strchr(path, '/');
100 if (!slash) {
101 newlen += sprintf(new + newlen, "%o %s", mode, path);
102 new[newlen++] = '\0';
Shawn Pearcee7024962006-08-23 02:49:00 -0400103 hashcpy((unsigned char*)new + newlen, (unsigned char *) buffer + len - 20);
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700104 newlen += 20;
105
106 used += len;
107 size -= len;
Florian Forster1d7f1712006-06-18 17:18:09 +0200108 buffer = (char *) buffer + len;
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700109 continue;
110 }
111
tony.luck@intel.comf220fb62005-05-02 10:57:02 -0700112 newlen += sprintf(new + newlen, "%o %.*s", S_IFDIR, (int)(slash - path), path);
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700113 new[newlen++] = 0;
114 sha1 = (unsigned char *)(new + newlen);
115 newlen += 20;
116
117 len = write_subdirectory(buffer, size, origpath, slash-origpath+1, sha1);
118
119 used += len;
120 size -= len;
Florian Forster1d7f1712006-06-18 17:18:09 +0200121 buffer = (char *) buffer + len;
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700122 }
123
Peter Eriksen8e440252006-04-02 14:44:09 +0200124 write_sha1_file(new, newlen, tree_type, result_sha1);
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700125 free(new);
126 return used;
127}
128
/*
 * Convert a tree object.
 *
 * First pass: walk the "<mode> <path>\0<20-byte sha1>" entries and
 * rewrite each SHA-1 in place with that of the converted object.
 * Second pass: hand the whole buffer to write_subdirectory(), which
 * writes the resulting tree and stores its SHA-1 in result_sha1.
 *
 * Dies with "corrupt tree object" if an entry is not NUL-terminated
 * within the buffer or has fewer than 20 bytes after its name.
 */
static void convert_tree(void *buffer, unsigned long size, unsigned char *result_sha1)
{
	void *orig_buffer = buffer;
	unsigned long orig_size = size;

	while (size) {
		/* Bounded search: never scan beyond the object for the NUL. */
		char *nul = memchr(buffer, '\0', size);
		size_t len;

		if (!nul)
			die("corrupt tree object");
		len = (size_t)(nul - (char *) buffer) + 1;
		/* Validate before touching the SHA-1 bytes, not after. */
		if (size - len < 20)
			die("corrupt tree object");

		convert_binary_sha1((char *) buffer + len);

		len += 20;
		size -= len;
		buffer = (char *) buffer + len;
	}

	write_subdirectory(orig_buffer, orig_size, "", 0, result_sha1);
}
148
/*
 * Parse an old-style textual date and return it as a mktime() value.
 *
 * Leading whitespace is skipped and the text up to the first newline
 * (or NUL) is copied into a local buffer.  The strptime() formats below
 * are then tried in order, each continuing where the previous one
 * stopped; when a format does not match, one of the known timezone
 * names is skipped instead.  If text remains after all formats have
 * been tried it is reported on stdout as "left: ...".
 *
 * Dies if the date text does not fit into the local buffer.
 */
static unsigned long parse_oldstyle_date(const char *buf)
{
	char c, *p;
	char buffer[100];
	struct tm tm;
	const char *formats[] = {
		"%c",
		"%a %b %d %T",
		"%Z",
		"%Y",
		" %Y",
		NULL
	};
	/* We only ever did a handful of timezones in the bad old format .. */
	const char *timezones[] = {
		"PDT", "PST", "CEST", NULL
	};
	const char **fmt = formats;

	p = buffer;
	while (isspace((unsigned char)*buf))
		buf++;
	/* Copy one line, keeping room for the terminator. */
	while ((c = *buf++) != '\n' && c != '\0') {
		if ((size_t)(p - buffer) >= sizeof(buffer) - 1)
			die("old-style date line too long");
		*p++ = c;
	}
	*p = 0;
	buf = buffer;
	memset(&tm, 0, sizeof(tm));
	do {
		const char *next = strptime(buf, *fmt, &tm);
		if (next) {
			if (!*next)
				return mktime(&tm);
			buf = next;
		} else {
			const char **tz = timezones;
			while (isspace((unsigned char)*buf))
				buf++;
			while (*tz) {
				size_t tzlen = strlen(*tz);
				/* strncmp stops at buf's NUL; memcmp would not. */
				if (!strncmp(buf, *tz, tzlen)) {
					buf += tzlen;
					break;
				}
				tz++;
			}
		}
		fmt++;
	} while (*buf && *fmt);
	printf("left: %s\n", buf);
	return mktime(&tm);
}
199
/*
 * Copy one "author"/"committer" line from *buf to dst, rewriting an
 * old-style date into "<seconds> -0700".
 *
 * *buf is advanced to the start of the following line and *sp is
 * reduced by the number of bytes consumed.  Everything up to and
 * including the separator after '>' is copied verbatim.  A date that
 * already starts with a digit is copied unchanged; otherwise it is run
 * through parse_oldstyle_date().
 *
 * Returns the number of bytes written to dst.  Dies if the line has no
 * newline, or no '>' followed by a separator before that newline.
 */
static int convert_date_line(char *dst, void **buf, unsigned long *sp)
{
	unsigned long size = *sp;
	char *line = *buf;
	char *next = strchr(line, '\n');
	char *date = strchr(line, '>');
	int len;

	/*
	 * The '>' must sit on this line with at least one character
	 * between it and the newline; a '>' found on a later line would
	 * make "len" span several lines.
	 */
	if (!next || !date || next - date < 2)
		die("missing or bad author/committer line %s", line);
	next++; date += 2;

	*buf = next;
	*sp = size - (next - line);

	len = date - line;
	memcpy(dst, line, len);
	dst += len;

	/* Is it already in new format? */
	if (isdigit((unsigned char)*date)) {
		int datelen = next - date;
		memcpy(dst, date, datelen);
		return len + datelen;
	}

	/*
	 * Hacky hacky: one of the sparse old-style commits does not have
	 * any date at all, but we can fake it by using the committer date.
	 */
	if (*date == '\n' && strchr(next, '>'))
		date = strchr(next, '>')+2;

	return len + sprintf(dst, "%lu -0700\n", parse_oldstyle_date(date));
}
235
236static void convert_date(void *buffer, unsigned long size, unsigned char *result_sha1)
237{
Christopher Li812666c2005-04-26 12:00:58 -0700238 char *new = xmalloc(size + 100);
Linus Torvaldsa44c9a52005-04-25 10:19:53 -0700239 unsigned long newlen = 0;
Pavel Roskina9486b02006-07-10 02:57:51 -0400240
241 /* "tree <sha1>\n" */
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700242 memcpy(new + newlen, buffer, 46);
243 newlen += 46;
Florian Forster1d7f1712006-06-18 17:18:09 +0200244 buffer = (char *) buffer + 46;
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700245 size -= 46;
246
Pavel Roskina9486b02006-07-10 02:57:51 -0400247 /* "parent <sha1>\n" */
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700248 while (!memcmp(buffer, "parent ", 7)) {
249 memcpy(new + newlen, buffer, 48);
250 newlen += 48;
Florian Forster1d7f1712006-06-18 17:18:09 +0200251 buffer = (char *) buffer + 48;
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700252 size -= 48;
253 }
254
Pavel Roskina9486b02006-07-10 02:57:51 -0400255 /* "author xyz <xyz> date" */
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700256 newlen += convert_date_line(new + newlen, &buffer, &size);
Pavel Roskina9486b02006-07-10 02:57:51 -0400257 /* "committer xyz <xyz> date" */
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700258 newlen += convert_date_line(new + newlen, &buffer, &size);
259
Pavel Roskina9486b02006-07-10 02:57:51 -0400260 /* Rest */
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700261 memcpy(new + newlen, buffer, size);
262 newlen += size;
263
Peter Eriksen8e440252006-04-02 14:44:09 +0200264 write_sha1_file(new, newlen, commit_type, result_sha1);
265 free(new);
Linus Torvaldsbfac5d92005-04-23 16:37:31 -0700266}
267
/*
 * Convert a commit object.
 *
 * The hex SHA-1s on the "tree" line and on every "parent" line are
 * rewritten in place to name the converted objects; the result is then
 * passed to convert_date(), which writes the new commit and stores its
 * SHA-1 in result_sha1.
 *
 * Dies if the buffer is too short for a "tree" line or does not start
 * with "tree ".
 */
static void convert_commit(void *buffer, unsigned long size, unsigned char *result_sha1)
{
	void *orig_buffer = buffer;
	unsigned long orig_size = size;

	/* Bound the printed text: buffer need not be NUL-terminated. */
	if (size < 46 || memcmp(buffer, "tree ", 5))
		die("Bad commit '%.*s'", (int) size, (char*) buffer);
	convert_ascii_sha1((char *) buffer + 5);
	buffer = (char *) buffer + 46;    /* "tree " + "hex sha1" + "\n" */
	size -= 46;
	/* "parent " + "hex sha1" + "\n" is 48 bytes */
	while (size >= 48 && !memcmp(buffer, "parent ", 7)) {
		convert_ascii_sha1((char *) buffer + 7);
		buffer = (char *) buffer + 48;
		size -= 48;
	}
	convert_date(orig_buffer, orig_size, result_sha1);
}
283
284static struct entry * convert_entry(unsigned char *sha1)
285{
286 struct entry *entry = lookup_entry(sha1);
Nicolas Pitre21666f12007-02-26 14:55:59 -0500287 enum object_type type;
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700288 void *buffer, *data;
Linus Torvaldsa44c9a52005-04-25 10:19:53 -0700289 unsigned long size;
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700290
291 if (entry->converted)
292 return entry;
Nicolas Pitre21666f12007-02-26 14:55:59 -0500293 data = read_sha1_file(sha1, &type, &size);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700294 if (!data)
295 die("unable to read object %s", sha1_to_hex(sha1));
296
Christopher Li812666c2005-04-26 12:00:58 -0700297 buffer = xmalloc(size);
Linus Torvaldsa44c9a52005-04-25 10:19:53 -0700298 memcpy(buffer, data, size);
Peter Eriksen8e440252006-04-02 14:44:09 +0200299
Nicolas Pitre21666f12007-02-26 14:55:59 -0500300 if (type == OBJ_BLOB) {
Peter Eriksen8e440252006-04-02 14:44:09 +0200301 write_sha1_file(buffer, size, blob_type, entry->new_sha1);
Nicolas Pitre21666f12007-02-26 14:55:59 -0500302 } else if (type == OBJ_TREE)
Linus Torvaldsa44c9a52005-04-25 10:19:53 -0700303 convert_tree(buffer, size, entry->new_sha1);
Nicolas Pitre21666f12007-02-26 14:55:59 -0500304 else if (type == OBJ_COMMIT)
Linus Torvaldsa44c9a52005-04-25 10:19:53 -0700305 convert_commit(buffer, size, entry->new_sha1);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700306 else
Nicolas Pitre21666f12007-02-26 14:55:59 -0500307 die("unknown object type %d in %s", type, sha1_to_hex(sha1));
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700308 entry->converted = 1;
309 free(buffer);
Linus Torvalds4e813042005-07-27 15:29:38 -0700310 free(data);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700311 return entry;
312}
313
314int main(int argc, char **argv)
315{
316 unsigned char sha1[20];
317 struct entry *entry;
318
Junio C Hamano53228a52005-11-26 00:50:02 -0800319 setup_git_directory();
320
Dmitry V. Levin31fff302006-05-09 01:43:38 +0400321 if (argc != 2)
Junio C Hamano215a7ad2005-09-07 17:26:23 -0700322 usage("git-convert-objects <sha1>");
Dmitry V. Levin31fff302006-05-09 01:43:38 +0400323 if (get_sha1(argv[1], sha1))
324 die("Not a valid object name %s", argv[1]);
Linus Torvaldsd98b46f2005-04-20 01:10:46 -0700325
326 entry = convert_entry(sha1);
327 printf("new sha1: %s\n", sha1_to_hex(entry->new_sha1));
328 return 0;
329}