diff extra/fast-export/svn-fast-export.c @ 1544:e9e55585ebf2 feature_1136

Add fast-export
author Chris Cannam <chris.cannam@soundsoftware.ac.uk>
date Tue, 12 Jan 2016 13:39:30 +0000
parents
children
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/extra/fast-export/svn-fast-export.c	Tue Jan 12 13:39:30 2016 +0000
@@ -0,0 +1,187 @@
+/*
+ * svn-fast-export.c
+ * ----------
+ *  Walk through each revision of a local Subversion repository and export it
+ *  in a stream that git-fast-import can consume.
+ *
+ * Author: Chris Lee <clee@kde.org>
+ * License: MIT <http://www.opensource.org/licenses/mit-license.php>
+ */
+
+#define _XOPEN_SOURCE
+#include <unistd.h>
+#include <string.h>
+#include <stdio.h>
+#include <time.h>
+
+#ifndef PATH_MAX
+#define PATH_MAX 4096
+#endif
+
+#include <apr_lib.h>
+#include <apr_getopt.h>
+#include <apr_general.h>
+
+#include <svn_fs.h>
+#include <svn_repos.h>
+#include <svn_pools.h>
+#include <svn_types.h>
+
+#undef SVN_ERR
+#define SVN_ERR(expr) SVN_INT_ERR(expr)
+#define apr_sane_push(arr, contents) *(char **)apr_array_push(arr) = contents
+
+#define TRUNK "/trunk/"
+
+time_t get_epoch(char *svn_date)
+{
+    struct tm tm = {0};
+    char *date = malloc(strlen(svn_date) * sizeof(char *));
+    strncpy(date, svn_date, strlen(svn_date) - 8);
+    strptime(date, "%Y-%m-%dT%H:%M:%S", &tm);
+    free(date);
+    return mktime(&tm);
+}
+
+int dump_blob(svn_fs_root_t *root, char *full_path, apr_pool_t *pool)
+{
+    apr_size_t     len;
+    svn_stream_t   *stream, *outstream;
+    svn_filesize_t stream_length;
+
+    SVN_ERR(svn_fs_file_length(&stream_length, root, full_path, pool));
+    SVN_ERR(svn_fs_file_contents(&stream, root, full_path, pool));
+
+    fprintf(stdout, "data %lu\n", stream_length);
+    fflush(stdout);
+
+    SVN_ERR(svn_stream_for_stdout(&outstream, pool));
+    SVN_ERR(svn_stream_copy(stream, outstream, pool));
+
+    fprintf(stdout, "\n");
+    fflush(stdout);
+
+    return 0;
+}
+
+int export_revision(svn_revnum_t rev, svn_fs_t *fs, apr_pool_t *pool)
+{
+    unsigned int         mark;
+    const void           *key;
+    void                 *val;
+    char                 *path, *file_change;
+    apr_pool_t           *revpool;
+    apr_hash_t           *changes, *props;
+    apr_hash_index_t     *i;
+    apr_array_header_t   *file_changes;
+    svn_string_t         *author, *committer, *svndate, *svnlog;
+    svn_boolean_t        is_dir;
+    svn_fs_root_t        *fs_root;
+    svn_fs_path_change_t *change;
+
+    fprintf(stderr, "Exporting revision %ld... ", rev);
+
+    SVN_ERR(svn_fs_revision_root(&fs_root, fs, rev, pool));
+    SVN_ERR(svn_fs_paths_changed(&changes, fs_root, pool));
+    SVN_ERR(svn_fs_revision_proplist(&props, fs, rev, pool));
+
+    revpool = svn_pool_create(pool);
+
+    file_changes = apr_array_make(pool, apr_hash_count(changes), sizeof(char *));
+    mark = 1;
+    for (i = apr_hash_first(pool, changes); i; i = apr_hash_next(i)) {
+        svn_pool_clear(revpool);
+        apr_hash_this(i, &key, NULL, &val);
+        path = (char *)key;
+        change = (svn_fs_path_change_t *)val;
+
+        SVN_ERR(svn_fs_is_dir(&is_dir, fs_root, path, revpool));
+
+        if (is_dir || strncmp(TRUNK, path, strlen(TRUNK))) {
+            continue;
+        }
+
+        if (change->change_kind == svn_fs_path_change_delete) {
+            apr_sane_push(file_changes, (char *)svn_string_createf(pool, "D %s", path + strlen(TRUNK))->data);
+        } else {
+            apr_sane_push(file_changes, (char *)svn_string_createf(pool, "M 644 :%u %s", mark, path + strlen(TRUNK))->data);
+            fprintf(stdout, "blob\nmark :%u\n", mark++);
+            dump_blob(fs_root, (char *)path, revpool);
+        }
+    }
+
+    if (file_changes->nelts == 0) {
+        fprintf(stderr, "skipping.\n");
+        svn_pool_destroy(revpool);
+        return 0;
+    }
+
+    author = apr_hash_get(props, "svn:author", APR_HASH_KEY_STRING);
+    if (svn_string_isempty(author))
+        author = svn_string_create("nobody", pool);
+    svndate = apr_hash_get(props, "svn:date", APR_HASH_KEY_STRING);
+    svnlog = apr_hash_get(props, "svn:log", APR_HASH_KEY_STRING);
+
+    fprintf(stdout, "commit refs/heads/master\n");
+    fprintf(stdout, "committer %s <%s@localhost> %ld -0000\n", author->data, author->data, get_epoch((char *)svndate->data));
+    fprintf(stdout, "data %d\n", svnlog->len);
+    fputs(svnlog->data, stdout);
+    fprintf(stdout, "\n");
+    fputs(apr_array_pstrcat(pool, file_changes, '\n'), stdout);
+    fprintf(stdout, "\n\n");
+    fflush(stdout);
+
+    svn_pool_destroy(revpool);
+
+    fprintf(stderr, "done!\n");
+
+    return 0;
+}
+
+int crawl_revisions(char *repos_path)
+{
+    apr_pool_t   *pool, *subpool;
+    svn_fs_t     *fs;
+    svn_repos_t  *repos;
+    svn_revnum_t youngest_rev, min_rev, max_rev, rev;
+
+    pool = svn_pool_create(NULL);
+
+    SVN_ERR(svn_fs_initialize(pool));
+    SVN_ERR(svn_repos_open(&repos, repos_path, pool));
+    if ((fs = svn_repos_fs(repos)) == NULL)
+        return -1;
+    SVN_ERR(svn_fs_youngest_rev(&youngest_rev, fs, pool));
+
+    min_rev = 1;
+    max_rev = youngest_rev;
+
+    subpool = svn_pool_create(pool);
+    for (rev = min_rev; rev <= max_rev; rev++) {
+        svn_pool_clear(subpool);
+        export_revision(rev, fs, subpool);
+    }
+
+    svn_pool_destroy(pool);
+
+    return 0;
+}
+
+int main(int argc, char *argv[])
+{
+    if (argc != 2) {
+        fprintf(stderr, "usage: %s REPOS_PATH\n", argv[0]);
+        return -1;
+    }
+
+    if (apr_initialize() != APR_SUCCESS) {
+        fprintf(stderr, "You lose at apr_initialize().\n");
+        return -1;
+    }
+
+    crawl_revisions(argv[1]);
+
+    apr_terminate();
+
+    return 0;
+}