Merge branch 'en/simplify-check-updates-in-unpack-trees' into maint
[git] / t / helper / test-path-utils.c
1 #include "test-tool.h"
2 #include "cache.h"
3 #include "string-list.h"
4 #include "utf8.h"
5
6 /*
7  * A "string_list_each_func_t" function that normalizes an entry from
8  * GIT_CEILING_DIRECTORIES.  If the path is unusable for some reason,
9  * die with an explanation.
10  */
11 static int normalize_ceiling_entry(struct string_list_item *item, void *unused)
12 {
13         char *ceil = item->string;
14
15         if (!*ceil)
16                 die("Empty path is not supported");
17         if (!is_absolute_path(ceil))
18                 die("Path \"%s\" is not absolute", ceil);
19         if (normalize_path_copy(ceil, ceil) < 0)
20                 die("Path \"%s\" could not be normalized", ceil);
21         return 1;
22 }
23
/*
 * Decode a command-line placeholder and store the result in *var:
 * "<null>" becomes NULL, "<empty>" becomes "", and any other input is
 * passed through unchanged.  A resulting string that starts with '<' or
 * '(' is rejected with die().
 */
static void normalize_argv_string(const char **var, const char *input)
{
	const char *value = input;

	if (!strcmp(input, "<null>"))
		value = NULL;
	else if (!strcmp(input, "<empty>"))
		value = "";

	*var = value;

	if (value && (value[0] == '<' || value[0] == '('))
		die("Bad value: %s\n", input);
}
36
/* One table row: an input path and the result(s) accepted for it. */
struct test_data {
	/* input: the path handed to the function under test (may be NULL) */
	const char *from;
	/* output: the expected result; NULL marks the end of a table */
	const char *to;
	/* output: a second acceptable result, or NULL if there is none */
	const char *alternative;
};
42
/*
 * Compatibility wrapper for OpenBSD, whose basename(3) and dirname(3)
 * have const parameters: it gives basename() the plain
 * "char *(*)(char *)" signature that test_function() takes.
 */
static char *posix_basename(char *path)
{
	char *last_component = basename(path);

	return last_component;
}
51
/*
 * Wrapper giving dirname(3) the plain "char *(*)(char *)" signature that
 * test_function() takes.
 */
static char *posix_dirname(char *path)
{
	char *parent = dirname(path);

	return parent;
}
56
57 static int test_function(struct test_data *data, char *(*func)(char *input),
58         const char *funcname)
59 {
60         int failed = 0, i;
61         char buffer[1024];
62         char *to;
63
64         for (i = 0; data[i].to; i++) {
65                 if (!data[i].from)
66                         to = func(NULL);
67                 else {
68                         xsnprintf(buffer, sizeof(buffer), "%s", data[i].from);
69                         to = func(buffer);
70                 }
71                 if (!strcmp(to, data[i].to))
72                         continue;
73                 if (!data[i].alternative)
74                         error("FAIL: %s(%s) => '%s' != '%s'\n",
75                                 funcname, data[i].from, to, data[i].to);
76                 else if (!strcmp(to, data[i].alternative))
77                         continue;
78                 else
79                         error("FAIL: %s(%s) => '%s' != '%s', '%s'\n",
80                                 funcname, data[i].from, to, data[i].to,
81                                 data[i].alternative);
82                 failed = 1;
83         }
84         return failed;
85 }
86
87 static struct test_data basename_data[] = {
88         /* --- POSIX type paths --- */
89         { NULL,              "."    },
90         { "",                "."    },
91         { ".",               "."    },
92         { "..",              ".."   },
93         { "/",               "/"    },
94         { "//",              "/", "//" },
95         { "///",             "/", "//" },
96         { "////",            "/", "//" },
97         { "usr",             "usr"  },
98         { "/usr",            "usr"  },
99         { "/usr/",           "usr"  },
100         { "/usr//",          "usr"  },
101         { "/usr/lib",        "lib"  },
102         { "usr/lib",         "lib"  },
103         { "usr/lib///",      "lib"  },
104
105 #if defined(__MINGW32__) || defined(_MSC_VER)
106         /* --- win32 type paths --- */
107         { "\\usr",           "usr"  },
108         { "\\usr\\",         "usr"  },
109         { "\\usr\\\\",       "usr"  },
110         { "\\usr\\lib",      "lib"  },
111         { "usr\\lib",        "lib"  },
112         { "usr\\lib\\\\\\",  "lib"  },
113         { "C:/usr",          "usr"  },
114         { "C:/usr",          "usr"  },
115         { "C:/usr/",         "usr"  },
116         { "C:/usr//",        "usr"  },
117         { "C:/usr/lib",      "lib"  },
118         { "C:usr/lib",       "lib"  },
119         { "C:usr/lib///",    "lib"  },
120         { "C:",              "."    },
121         { "C:a",             "a"    },
122         { "C:/",             "/"    },
123         { "C:///",           "/"    },
124         { "\\",              "\\", "/" },
125         { "\\\\",            "\\", "/" },
126         { "\\\\\\",          "\\", "/" },
127 #endif
128         { NULL,              NULL   }
129 };
130
131 static struct test_data dirname_data[] = {
132         /* --- POSIX type paths --- */
133         { NULL,              "."      },
134         { "",                "."      },
135         { ".",               "."      },
136         { "..",              "."      },
137         { "/",               "/"      },
138         { "//",              "/", "//" },
139         { "///",             "/", "//" },
140         { "////",            "/", "//" },
141         { "usr",             "."      },
142         { "/usr",            "/"      },
143         { "/usr/",           "/"      },
144         { "/usr//",          "/"      },
145         { "/usr/lib",        "/usr"   },
146         { "usr/lib",         "usr"    },
147         { "usr/lib///",      "usr"    },
148
149 #if defined(__MINGW32__) || defined(_MSC_VER)
150         /* --- win32 type paths --- */
151         { "\\",              "\\"     },
152         { "\\\\",            "\\\\"   },
153         { "\\usr",           "\\"     },
154         { "\\usr\\",         "\\"     },
155         { "\\usr\\\\",       "\\"     },
156         { "\\usr\\lib",      "\\usr"  },
157         { "usr\\lib",        "usr"    },
158         { "usr\\lib\\\\\\",  "usr"    },
159         { "C:a",             "C:."    },
160         { "C:/",             "C:/"    },
161         { "C:///",           "C:/"    },
162         { "C:/usr",          "C:/"    },
163         { "C:/usr/",         "C:/"    },
164         { "C:/usr//",        "C:/"    },
165         { "C:/usr/lib",      "C:/usr" },
166         { "C:usr/lib",       "C:usr"  },
167         { "C:usr/lib///",    "C:usr"  },
168         { "\\\\\\",          "\\"     },
169         { "\\\\\\\\",        "\\"     },
170         { "C:",              "C:.", "." },
171 #endif
172         { NULL,              NULL     }
173 };
174
/*
 * Returns 1 if path is reported as .gitmodules by either the HFS or the
 * NTFS check, 0 otherwise.  The NTFS check is only consulted when the HFS
 * check says no.
 */
static int is_dotgitmodules(const char *path)
{
	if (is_hfs_dotgitmodules(path))
		return 1;

	return !!is_ntfs_dotgitmodules(path);
}
179
180 static int cmp_by_st_size(const void *a, const void *b)
181 {
182         intptr_t x = (intptr_t)((struct string_list_item *)a)->util;
183         intptr_t y = (intptr_t)((struct string_list_item *)b)->util;
184
185         return x > y ? -1 : (x < y ? +1 : 0);
186 }
187
/*
 * Small deterministic pseudo-random generator, copied from
 * `test-genrandom.c`.  The state starts at 1234 and every call advances
 * it as state = state * 1103515245 + 12345 (wrapping at 64 bits), then
 * returns the new state.
 */
static uint64_t my_random_value = 1234;

static uint64_t my_random(void)
{
	const uint64_t multiplier = 1103515245;
	const uint64_t increment = 12345;
	uint64_t next = my_random_value * multiplier + increment;

	my_random_value = next;
	return next;
}
199
/*
 * A fast approximation of the square root, without requiring math.h.
 *
 * It uses Newton's method to approximate the solution of 0 = x^2 - value,
 * starting at x = value and stopping as soon as a step is smaller than
 * 1e-6 in magnitude.
 *
 * Zero and negative inputs yield 0, and NaN is returned unchanged.  The
 * iteration would never satisfy its stopping condition for such inputs,
 * and a variance computed as E[x^2] - E[x]^2 can come out slightly
 * negative through rounding.
 */
static double my_sqrt(double value)
{
	const double epsilon = 1e-6;
	double x = value;

	/* Only NaN compares unequal to itself. */
	if (value != value)
		return value;
	if (value <= 0)
		return 0;

	for (;;) {
		double delta = (value / x - x) / 2;
		if (delta < epsilon && delta > -epsilon)
			return x + delta;
		x += delta;
	}
}
220
221 static int protect_ntfs_hfs_benchmark(int argc, const char **argv)
222 {
223         size_t i, j, nr, min_len = 3, max_len = 20;
224         char **names;
225         int repetitions = 15, file_mode = 0100644;
226         uint64_t begin, end;
227         double m[3][2], v[3][2];
228         uint64_t cumul;
229         double cumul2;
230
231         if (argc > 1 && !strcmp(argv[1], "--with-symlink-mode")) {
232                 file_mode = 0120000;
233                 argc--;
234                 argv++;
235         }
236
237         nr = argc > 1 ? strtoul(argv[1], NULL, 0) : 1000000;
238         ALLOC_ARRAY(names, nr);
239
240         if (argc > 2) {
241                 min_len = strtoul(argv[2], NULL, 0);
242                 if (argc > 3)
243                         max_len = strtoul(argv[3], NULL, 0);
244                 if (min_len > max_len)
245                         die("min_len > max_len");
246         }
247
248         for (i = 0; i < nr; i++) {
249                 size_t len = min_len + (my_random() % (max_len + 1 - min_len));
250
251                 names[i] = xmallocz(len);
252                 while (len > 0)
253                         names[i][--len] = (char)(' ' + (my_random() % ('\x7f' - ' ')));
254         }
255
256         for (protect_ntfs = 0; protect_ntfs < 2; protect_ntfs++)
257                 for (protect_hfs = 0; protect_hfs < 2; protect_hfs++) {
258                         cumul = 0;
259                         cumul2 = 0;
260                         for (i = 0; i < repetitions; i++) {
261                                 begin = getnanotime();
262                                 for (j = 0; j < nr; j++)
263                                         verify_path(names[j], file_mode);
264                                 end = getnanotime();
265                                 printf("protect_ntfs = %d, protect_hfs = %d: %lfms\n", protect_ntfs, protect_hfs, (end-begin) / (double)1e6);
266                                 cumul += end - begin;
267                                 cumul2 += (end - begin) * (end - begin);
268                         }
269                         m[protect_ntfs][protect_hfs] = cumul / (double)repetitions;
270                         v[protect_ntfs][protect_hfs] = my_sqrt(cumul2 / (double)repetitions - m[protect_ntfs][protect_hfs] * m[protect_ntfs][protect_hfs]);
271                         printf("mean: %lfms, stddev: %lfms\n", m[protect_ntfs][protect_hfs] / (double)1e6, v[protect_ntfs][protect_hfs] / (double)1e6);
272                 }
273
274         for (protect_ntfs = 0; protect_ntfs < 2; protect_ntfs++)
275                 for (protect_hfs = 0; protect_hfs < 2; protect_hfs++)
276                         printf("ntfs=%d/hfs=%d: %lf%% slower\n", protect_ntfs, protect_hfs, (m[protect_ntfs][protect_hfs] - m[0][0]) * 100 / m[0][0]);
277
278         return 0;
279 }
280
281 int cmd__path_utils(int argc, const char **argv)
282 {
283         if (argc == 3 && !strcmp(argv[1], "normalize_path_copy")) {
284                 char *buf = xmallocz(strlen(argv[2]));
285                 int rv = normalize_path_copy(buf, argv[2]);
286                 if (rv)
287                         buf = "++failed++";
288                 puts(buf);
289                 return 0;
290         }
291
292         if (argc >= 2 && !strcmp(argv[1], "real_path")) {
293                 while (argc > 2) {
294                         puts(real_path(argv[2]));
295                         argc--;
296                         argv++;
297                 }
298                 return 0;
299         }
300
301         if (argc >= 2 && !strcmp(argv[1], "absolute_path")) {
302                 while (argc > 2) {
303                         puts(absolute_path(argv[2]));
304                         argc--;
305                         argv++;
306                 }
307                 return 0;
308         }
309
310         if (argc == 4 && !strcmp(argv[1], "longest_ancestor_length")) {
311                 int len;
312                 struct string_list ceiling_dirs = STRING_LIST_INIT_DUP;
313                 char *path = xstrdup(argv[2]);
314
315                 /*
316                  * We have to normalize the arguments because under
317                  * Windows, bash mangles arguments that look like
318                  * absolute POSIX paths or colon-separate lists of
319                  * absolute POSIX paths into DOS paths (e.g.,
320                  * "/foo:/foo/bar" might be converted to
321                  * "D:\Src\msysgit\foo;D:\Src\msysgit\foo\bar"),
322                  * whereas longest_ancestor_length() requires paths
323                  * that use forward slashes.
324                  */
325                 if (normalize_path_copy(path, path))
326                         die("Path \"%s\" could not be normalized", argv[2]);
327                 string_list_split(&ceiling_dirs, argv[3], PATH_SEP, -1);
328                 filter_string_list(&ceiling_dirs, 0,
329                                    normalize_ceiling_entry, NULL);
330                 len = longest_ancestor_length(path, &ceiling_dirs);
331                 string_list_clear(&ceiling_dirs, 0);
332                 free(path);
333                 printf("%d\n", len);
334                 return 0;
335         }
336
337         if (argc >= 4 && !strcmp(argv[1], "prefix_path")) {
338                 const char *prefix = argv[2];
339                 int prefix_len = strlen(prefix);
340                 int nongit_ok;
341                 setup_git_directory_gently(&nongit_ok);
342                 while (argc > 3) {
343                         puts(prefix_path(prefix, prefix_len, argv[3]));
344                         argc--;
345                         argv++;
346                 }
347                 return 0;
348         }
349
350         if (argc == 4 && !strcmp(argv[1], "strip_path_suffix")) {
351                 char *prefix = strip_path_suffix(argv[2], argv[3]);
352                 printf("%s\n", prefix ? prefix : "(null)");
353                 return 0;
354         }
355
356         if (argc == 3 && !strcmp(argv[1], "print_path")) {
357                 puts(argv[2]);
358                 return 0;
359         }
360
361         if (argc == 4 && !strcmp(argv[1], "relative_path")) {
362                 struct strbuf sb = STRBUF_INIT;
363                 const char *in, *prefix, *rel;
364                 normalize_argv_string(&in, argv[2]);
365                 normalize_argv_string(&prefix, argv[3]);
366                 rel = relative_path(in, prefix, &sb);
367                 if (!rel)
368                         puts("(null)");
369                 else
370                         puts(strlen(rel) > 0 ? rel : "(empty)");
371                 strbuf_release(&sb);
372                 return 0;
373         }
374
375         if (argc == 2 && !strcmp(argv[1], "basename"))
376                 return test_function(basename_data, posix_basename, argv[1]);
377
378         if (argc == 2 && !strcmp(argv[1], "dirname"))
379                 return test_function(dirname_data, posix_dirname, argv[1]);
380
381         if (argc > 2 && !strcmp(argv[1], "is_dotgitmodules")) {
382                 int res = 0, expect = 1, i;
383                 for (i = 2; i < argc; i++)
384                         if (!strcmp("--not", argv[i]))
385                                 expect = !expect;
386                         else if (expect != is_dotgitmodules(argv[i]))
387                                 res = error("'%s' is %s.gitmodules", argv[i],
388                                             expect ? "not " : "");
389                         else
390                                 fprintf(stderr, "ok: '%s' is %s.gitmodules\n",
391                                         argv[i], expect ? "" : "not ");
392                 return !!res;
393         }
394
395         if (argc > 2 && !strcmp(argv[1], "file-size")) {
396                 int res = 0, i;
397                 struct stat st;
398
399                 for (i = 2; i < argc; i++)
400                         if (stat(argv[i], &st))
401                                 res = error_errno("Cannot stat '%s'", argv[i]);
402                         else
403                                 printf("%"PRIuMAX"\n", (uintmax_t)st.st_size);
404                 return !!res;
405         }
406
407         if (argc == 4 && !strcmp(argv[1], "skip-n-bytes")) {
408                 int fd = open(argv[2], O_RDONLY), offset = atoi(argv[3]);
409                 char buffer[65536];
410
411                 if (fd < 0)
412                         die_errno("could not open '%s'", argv[2]);
413                 if (lseek(fd, offset, SEEK_SET) < 0)
414                         die_errno("could not skip %d bytes", offset);
415                 for (;;) {
416                         ssize_t count = read(fd, buffer, sizeof(buffer));
417                         if (count < 0)
418                                 die_errno("could not read '%s'", argv[2]);
419                         if (!count)
420                                 break;
421                         if (write(1, buffer, count) < 0)
422                                 die_errno("could not write to stdout");
423                 }
424                 close(fd);
425                 return 0;
426         }
427
428         if (argc > 5 && !strcmp(argv[1], "slice-tests")) {
429                 int res = 0;
430                 long offset, stride, i;
431                 struct string_list list = STRING_LIST_INIT_NODUP;
432                 struct stat st;
433
434                 offset = strtol(argv[2], NULL, 10);
435                 stride = strtol(argv[3], NULL, 10);
436                 if (stride < 1)
437                         stride = 1;
438                 for (i = 4; i < argc; i++)
439                         if (stat(argv[i], &st))
440                                 res = error_errno("Cannot stat '%s'", argv[i]);
441                         else
442                                 string_list_append(&list, argv[i])->util =
443                                         (void *)(intptr_t)st.st_size;
444                 QSORT(list.items, list.nr, cmp_by_st_size);
445                 for (i = offset; i < list.nr; i+= stride)
446                         printf("%s\n", list.items[i].string);
447
448                 return !!res;
449         }
450
451         if (argc > 1 && !strcmp(argv[1], "protect_ntfs_hfs"))
452                 return !!protect_ntfs_hfs_benchmark(argc - 1, argv + 1);
453
454         if (argc > 1 && !strcmp(argv[1], "is_valid_path")) {
455                 int res = 0, expect = 1, i;
456
457                 for (i = 2; i < argc; i++)
458                         if (!strcmp("--not", argv[i]))
459                                 expect = 0;
460                         else if (expect != is_valid_path(argv[i]))
461                                 res = error("'%s' is%s a valid path",
462                                             argv[i], expect ? " not" : "");
463                         else
464                                 fprintf(stderr,
465                                         "'%s' is%s a valid path\n",
466                                         argv[i], expect ? "" : " not");
467
468                 return !!res;
469         }
470
471         fprintf(stderr, "%s: unknown function name: %s\n", argv[0],
472                 argv[1] ? argv[1] : "(there was none)");
473         return 1;
474 }